diff --git a/CommonLib/CommonLib.vcxproj b/CommonLib/CommonLib.vcxproj
index 321cf13..8836c8c 100644
--- a/CommonLib/CommonLib.vcxproj
+++ b/CommonLib/CommonLib.vcxproj
@@ -112,6 +112,7 @@
     </Text>
   </ItemGroup>
   <ItemGroup>
+    <ClInclude Include="kthread.h" />
     <ClInclude Include="matlab_io.h" />
     <ClInclude Include="thread_pool.h" />
   </ItemGroup>
diff --git a/CommonLib/CommonLib.vcxproj.filters b/CommonLib/CommonLib.vcxproj.filters
index 20334ba..7d4df5e 100644
--- a/CommonLib/CommonLib.vcxproj.filters
+++ b/CommonLib/CommonLib.vcxproj.filters
@@ -28,6 +28,9 @@
     <ClInclude Include="thread_pool.h">
       <Filter>Header Files</Filter>
     </ClInclude>
+    <ClInclude Include="kthread.h">
+      <Filter>Header Files</Filter>
+    </ClInclude>
   </ItemGroup>
   <ItemGroup>
     <ClCompile Include="matlab_io.cpp">
diff --git a/CommonLib/kthread.h b/CommonLib/kthread.h
new file mode 100644
index 0000000..52abb5d
--- /dev/null
+++ b/CommonLib/kthread.h
@@ -0,0 +1,145 @@
+#ifndef KTHREAD_H
+#define KTHREAD_H
+#include <stdlib.h>
+#include <limits.h>
+#include <thread>
+#include <vector>
+#include <atomic>
+
+using std::atomic;
+using std::thread;
+using std::vector;
+
+/************
+ * kt_for() *
+ ************/
+
+template <typename T>
+using FuncType3Arg = void (*)(vector<T>&, long, int); // callback(whole data vector, item index, worker index)
+
+template <typename T>
+using FuncType1Arg = void (*)(T&); // callback(one element of the data vector)
+
+template <class T>
+struct kt_for_t; // forward declaration: ktf_worker_t holds a pointer back to the shared job
+
+template <typename T>
+struct ktf_worker_t // per-thread slot; a pointer to one of these is what each worker thread receives
+{
+    kt_for_t<T>* t; // shared job description this worker belongs to
+    atomic<long> i; // next item index to claim; advanced by n_threads per claim, by the owner or by steal_work()
+};
+
+template <typename T>
+struct kt_for_t // job description shared by all workers of one kt_for() call
+{
+    int n_threads; // number of worker threads; also the stride added to a cursor on every claim
+    long n; // number of items (size of *data when kt_for() was entered)
+
+    ktf_worker_t<T>* w; // array of n_threads worker slots
+    FuncType1Arg<T> func1Arg; // per-element callback; assigned only by the 1-argument kt_for overload
+    FuncType3Arg<T> func3Arg; // (data, index, worker) callback; assigned only by the 3-argument kt_for overload
+    vector<T>* data; // the caller's vector being processed; not owned
+};
+
+template <class T>
+static inline long steal_work(kt_for_t<T>* t) // claims one item from the worker with the smallest cursor; returns -1 if that claim is past the end
+{
+    int i, min_i = -1;
+    long k, min = LONG_MAX;
+    for (i = 0; i < t->n_threads; ++i) // scan all worker cursors for the smallest one
+        if (min > t->w[i].i)
+            min = t->w[i].i, min_i = i; // the cursor is loaded again here, so min can differ from the value just compared
+    k = t->w[min_i].i.fetch_add(t->n_threads); // atomically take that worker's next index (min_i would still be -1 only if no cursor was below LONG_MAX)
+    return k >= t->n ? -1 : k; // an index at or beyond n means nothing was left to take
+}
+
+template <class T>
+static void ktf_worker_1_arg(void* data) // thread entry point used by the 1-argument kt_for; data must point to a ktf_worker_t<T>
+{
+    ktf_worker_t<T>* w = (ktf_worker_t<T> *)data;
+    long i;
+
+    for (;;) // phase 1: walk this worker's own cursor in steps of n_threads until it passes n
+    {
+        i = w->i.fetch_add(w->t->n_threads); // atomic because steal_work() on other threads advances the same cursor
+        if (i >= w->t->n)
+            break;
+        w->t->func1Arg(( * w->t->data)[i]);
+    }
+    while ((i = steal_work<T>(w->t)) >= 0) // phase 2: keep claiming items via steal_work() until it reports -1
+        w->t->func1Arg((*w->t->data)[i]);
+}
+
+template <class T>
+static void ktf_worker_3_arg(void* data) // thread entry point used by the 3-argument kt_for; data must point to a ktf_worker_t<T>
+{
+    ktf_worker_t<T>* w = (ktf_worker_t<T> *)data;
+    long i;
+
+    for (;;) // phase 1: walk this worker's own cursor in steps of n_threads until it passes n
+    {
+        i = w->i.fetch_add(w->t->n_threads); // atomic because steal_work() on other threads advances the same cursor
+        if (i >= w->t->n)
+            break;
+        w->t->func3Arg(*w->t->data, i, w - w->t->w); // third argument: this worker's position in the slot array
+    }
+    while ((i = steal_work<T>(w->t)) >= 0) // phase 2: keep claiming items via steal_work() until it reports -1
+        w->t->func3Arg(*w->t->data, i, w - w->t->w);
+}
+
+/// Calls func(vData, i, worker) once for each index i in [0, vData.size()) and returns when all
+/// calls finished. n_threads > 1 spawns that many std::threads (worker = 0..n_threads-1, items
+/// handed out by stride with stealing); otherwise the loop runs inline with worker = 0.
+/// Worker slots live in a std::vector, not alloca(): the atomics are constructed and heap-backed.
+template <typename T>
+void kt_for(int n_threads, FuncType3Arg<T> func, vector<T>& vData)
+{
+    const long n = (long)vData.size();
+    if (n_threads <= 1)
+    {
+        for (long j = 0; j < n; ++j)
+            func(vData, j, 0);
+        return;
+    }
+    kt_for_t<T> t{}; // value-initialised so the unused func1Arg slot is null rather than indeterminate
+    t.func3Arg = func, t.data = &vData, t.n_threads = n_threads, t.n = n;
+    vector<ktf_worker_t<T>> workers(n_threads); // sized once and never resized: slot addresses stay stable
+    t.w = workers.data();
+    for (int i = 0; i < n_threads; ++i)
+        t.w[i].t = &t, t.w[i].i.store(i); // worker i starts at item i and then strides by n_threads
+    vector<thread> vThread;
+    for (int i = 0; i < n_threads; ++i)
+        vThread.emplace_back(ktf_worker_3_arg<T>, &t.w[i]);
+    for (auto& th : vThread) // t and workers must outlive every thread, so join before leaving
+        th.join();
+}
+
+/// Calls func(vData[i]) once for each element of vData and returns when all calls finished.
+/// n_threads > 1 spawns that many std::threads (items handed out by stride with stealing);
+/// otherwise the elements are processed inline, in order, on the calling thread.
+/// Worker slots live in a std::vector, not alloca(): the atomics are constructed and heap-backed.
+template <typename T>
+void kt_for(int n_threads, FuncType1Arg<T> func, vector<T>& vData)
+{
+    const long n = (long)vData.size();
+    if (n_threads <= 1)
+    {
+        for (long j = 0; j < n; ++j)
+            func(vData[j]);
+        return;
+    }
+    kt_for_t<T> t{}; // value-initialised so the unused func3Arg slot is null rather than indeterminate
+    t.func1Arg = func, t.data = &vData, t.n_threads = n_threads, t.n = n;
+    vector<ktf_worker_t<T>> workers(n_threads); // sized once and never resized: slot addresses stay stable
+    t.w = workers.data();
+    for (int i = 0; i < n_threads; ++i)
+        t.w[i].t = &t, t.w[i].i.store(i); // worker i starts at item i and then strides by n_threads
+    vector<thread> vThread;
+    for (int i = 0; i < n_threads; ++i)
+        vThread.emplace_back(ktf_worker_1_arg<T>, &t.w[i]);
+    for (auto& th : vThread) // t and workers must outlive every thread, so join before leaving
+        th.join();
+}
+
+#endif
diff --git a/CppRun/calc_entropy.cpp b/CppRun/calc_entropy.cpp
index ea85df5..4e507c6 100644
--- a/CppRun/calc_entropy.cpp
+++ b/CppRun/calc_entropy.cpp
@@ -33,6 +33,7 @@
 #include "common.h"
 #include "CommonLib/thread_pool.h"
 #include "CommonLib/matlab_io.h"
+#include "CommonLib/kthread.h"
 using namespace std;
 using std::cout;
 using std::vector;
@@ -106,7 +107,6 @@ bool ReadInfoFromMat(const string & filePath, vector<vector<string> >&vvDs, vect
 	// ¶ÁÈ¡ds×Ö·û´®
 	pMxArray = mxGetField(pMxG, 0, firstChildName.c_str()); // ds
 	OUTER_FOR_BEGIN
-		// cout << childRowNum << '\t' << childColNum << endl;
 		vvDs.push_back(vector<string>());
 		vvDs.back().resize(childRowNum * childColNum);
 		INNTER_FOR_BEGIN
@@ -144,7 +144,7 @@ struct ThreadParam { // 
 	fs::path outFilePath;
 	vector<unordered_set<string> >* pvusWord;
 };
-void ThreadProcessData(const ThreadParam& param) {
+void ThreadProcessData(ThreadParam& param) {
 	const fs::path& matFilePath = param.matFilePath;
 	const fs::path& outFilePath = param.outFilePath;
 	vector <unordered_set<string> >& vusWord = *param.pvusWord;
@@ -156,11 +156,8 @@ void ThreadProcessData(const ThreadParam& param) {
 	vector<vector<string> > vvDs; // Ã¿¸öÖªÊ¶¿ÅÁ£µÄds¾ØÕó£¨´Ê»ã¾ØÕó£©
 	vector<vector<double> > vvFr; // ´Ê»ã¶ÔÓ¦µÄÆµÂÊ
 
-	// cout << matFilePath.string() << endl;
 	// ¶ÁÈ¡G½á¹¹ÌåÖÐµÄdsºÍfrÐÅÏ¢
 	ReadInfoFromMat(matFilePath.string(), vvDs, vvFr);
-	// res.vvEntropy.push_back(vvFr[0]);
-	// cout << vvDs.size() << '\t' << vvDs[0].size() << endl;
 	const int numLiterature = vusWord.size(); // pubmed ÎÄ¼þÖÐ°üº¬µÄÎÄÏ×ÊýÁ¿
 	const int numGroup = vvDs.size(); // ds°üº¬µÄ×éÊý
 	hs.resize(numGroup * numLiterature);
@@ -176,9 +173,6 @@ void ThreadProcessData(const ThreadParam& param) {
 			for (int j = 0; j < numWord; ++j) {
 				if (vusWord[i].find(vDs[j]) != vusWord[i].end()) { // ÕâÒ»×éµ¥´ÊÖÐµÄjË÷ÒýÎ»ÖÃµÄµ¥´ÊÔÚµÚi¸öÎÄÏ×ÖÐ³öÏÖ¹ý
 					vX[i][j] = 1;
-					if (groupIdx == 1 && i == 2) {
-						// cout << matFilePath.string() << '\t' << j+1 << '\t' << vDs[j] << endl;
-					}
 				}
 			}
 		}
@@ -216,8 +210,8 @@ void ThreadProcessData(const ThreadParam& param) {
 	}
 	/* ½«½á¹û£¨hsºÍhr£©Ð´ÈëÃ¿¸öÖªÊ¶¿ÅÁ£µÄÄ¿Â¼ÄÚ */
 	MATFile* pMatFile = matOpen(outFilePath.string().c_str(), "w");
-	SaveMtxDouble(hs.data(), pMatFile, "hs1", numGroup, numLiterature);
-	SaveMtxDouble(hr.data(), pMatFile, "hr1", numLiterature, numGroup);
+	SaveMtxDouble(hs.data(), pMatFile, "hs", numGroup, numLiterature);
+	SaveMtxDouble(hr.data(), pMatFile, "hr", numLiterature, numGroup);
 	matClose(pMatFile);
 }
 
@@ -228,7 +222,7 @@ void CalcEntropy(int argc, const char** argv) {
 	// 1. ÖªÊ¶¿ÅÁ£µÄ¸¸Ä¿Â¼Ãû³Æ
 	// 2. °üº¬¸ßÆµ´Ê»ãÐÅÏ¢µÄmatÎÄ¼þµÄºó×º
 	// 3. °üº¬´¦ÀíºóµÄpubmedÎÄÏ×ÐÅÏ¢µÄmatÎÄ¼þÂ·¾¶
-	// 4. ´æ·ÅÊä³ö½á¹ûµÄmatÎÄ¼þµÄºó×º£¨Ã¿¸öÖªÊ¶¿ÅÁ£Ä¿Â¼ÖÐÉú³ÉÒ»¸ö½á¹ûÎÄ¼þ£©
+	// 4. ´æ·ÅÊä³ö½á¹ûµÄmatÎÄ¼þÃû£¨Ã¿¸öÖªÊ¶¿ÅÁ£Ä¿Â¼ÖÐÉú³ÉÒ»¸ö½á¹ûÎÄ¼þ£©
 	// 5. Ïß³ÌÊýÁ¿(¿ÉÑ¡)
 	if (argc < 5) {
 		cout << "This program should take at least 4 arguments(1.parrent Dir; 2. mat file suffix; 3. pubmed mat file; 4. out mat filename; [5. thread number]; [6. word out mat filepath])!" << endl;
@@ -241,7 +235,6 @@ void CalcEntropy(int argc, const char** argv) {
 	int numThread = 1;
 	if (argc >= 5) numThread = atoi(argv[5]);
 	if (numThread < 1) numThread = 1;
-	// cout << "thread num: " << numThread << endl;
 
 	/* ¶ÁÈë´¦ÀíºóµÄpubmedÎÄÏ×ÐÅÏ¢µÄmatÎÄ¼þ£¬Ö»¶ÁÈëÕªÒªÐÅÏ¢£¬¼´±äÁ¿abs1 */
 	vector<string> vAbstract;
@@ -281,11 +274,13 @@ void CalcEntropy(int argc, const char** argv) {
 		for (auto& word : vWord) {
 			string upWord(word);
 			transform(upWord.begin(), upWord.end(), upWord.begin(), ::toupper);
-			// cout << upWord << endl;
 			vusAbsWord[i].insert(upWord);
 		}
 	}
+	finish = clock();
+	cout << "read abstract time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 	/* ½«·Ö¸î½á¹ûÐ´ÈëmatÎÄ¼þ */
+	begin = clock();
 	if (argc >= 6) {
 		MATFile* pMatFile = matOpen(argv[6], "w");
 		mxArray* pCellMtx= mxCreateCellMatrix(1, vvWordMtx.size());
@@ -297,21 +292,16 @@ void CalcEntropy(int argc, const char** argv) {
 			}
 			mxSetCell(pCellMtx, i, pChildCellMtx);
 		}
-		matPutVariable(pMatFile, "wd1", pCellMtx);
+		matPutVariable(pMatFile, "wd", pCellMtx);
 		matClose(pMatFile);
 		mxDestroyArray(pCellMtx);
 	}
 	finish = clock();
-	cout << "abstract time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
-	//auto & vTest = vvWordMtx[0];
-	//cout << vTest.size() << endl;
-	//for (auto& str : vTest) cout << str << endl;
-
+	cout << "write abstract word time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* ±éÀúËùÓÐµÄÖªÊ¶¿ÅÁ£Ä¿Â¼£¬ÖðÒ»½øÐÐ´¦Àí */
 	begin = clock();
-	ThreadPool thPool(numThread);
-	// ThreadPool thPool(24);
+	//ThreadPool thPool(numThread);
 	// ²é¿´ÖªÊ¶¿ÅÁ£ÊýÁ¿
 	int numKnowledgeParticle = 0;
 	FOREACH_PARTICLE_START
@@ -319,27 +309,21 @@ void CalcEntropy(int argc, const char** argv) {
 	FOREACH_PARTICLE_END
 
 	// ±éÀúÃ¿¸öÖªÊ¶¿ÅÁ££¬ÖðÒ»½øÐÐ´¦Àí
+	vector<ThreadParam> vTP;
 	for (int round = 0; round < 1; ++round) { // ²âÊÔÓÃ
 		int i = 0;
 		FOREACH_PARTICLE_START
-			ThreadParam tParam = { file, childDir / outFileName, &vusAbsWord };
-			thPool.enqueue(ThreadProcessData, tParam);
+			//ThreadParam tParam = { file, childDir / outFileName, &vusAbsWord };
+			//thPool.enqueue(ThreadProcessData, tParam);
+			vTP.push_back({ file, childDir / outFileName, &vusAbsWord });
 			i++;
 		FOREACH_PARTICLE_END
 	}
+	kt_for(numThread, ThreadProcessData, vTP);
 	
 	// synchronize
-	thPool.~ThreadPool();
+	//thPool.~ThreadPool();
 	finish = clock();
 
 	cout << "thread pool time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
-
-	//ofstream ofs("test_out.txt");
-	//for (auto& item : vEntropyResult) {
-	//	auto& vvEntropy = item.vvEntropy;
-	//	auto& vVal = vvEntropy[0];
-	//	for (auto& val : vVal) ofs << val << ' ';
-	//	ofs << endl;
-	//}
-	//ofs.close();
 }
\ No newline at end of file
diff --git a/CppRun/main.cpp b/CppRun/main.cpp
index c4eeece..d34d699 100644
--- a/CppRun/main.cpp
+++ b/CppRun/main.cpp
@@ -27,6 +27,7 @@ int main(int argc, const char** argv) {
 	}
 	else if (string(argv[1]) == "CalcEntropy") {
 		/* è®¡ç®—ä¿¡æ¯ç†µ */
+		cout << "CalcEntropy" << endl;
 		CalcEntropy(argc - 1, argv + 1);
 	}
 	finish = clock();
diff --git a/CppRun/process_pubmed_txt.cpp b/CppRun/process_pubmed_txt.cpp
index 8eb630c..2f62c14 100644
--- a/CppRun/process_pubmed_txt.cpp
+++ b/CppRun/process_pubmed_txt.cpp
@@ -14,7 +14,9 @@
 #include <unordered_map>
 #include <mat.h>
 #include "common.h"
+#include "CommonLib/thread_pool.h"
 #include "CommonLib/matlab_io.h"
+#include "CommonLib/kthread.h"
 using namespace std;
 
 /* å°†ç»“æžœå†™å…¥matæ–‡ä»¶ */
@@ -35,7 +37,7 @@ bool SavePubmed(const string& matPath,
 	}
 
 	// åˆ›å»ºç»“æž„ä½“æ•°æ®
-	mxArray* mxStruct = mxCreateStructMatrix(1, 1, vTgName.size(), vTgChars.data());
+	mxArray* mxStruct = mxCreateStructMatrix(1, 1, (int)vTgName.size(), vTgChars.data());
 	// åˆ›å»ºcell matrix
 	unordered_map<string, mxArray*> ummxCellMtx;
 	for (auto & tgName : vTgName) {
@@ -68,9 +70,45 @@ bool SavePubmed(const string& matPath,
 
 	return true;
 }
+/* Process one article */
+struct ThreadParam { // work item handed to ThreadProcessArticle: one article's line range plus the shared lookup tables
+	unordered_map<string, string> *pumTagContent; // output: tag name -> concatenated content for this article
+	vector<string>* pvLineTag; // per-line tag strings; indexed with the same line index as pvStrPubmedTxt
+	vector<string>* pvTgName; // tag names; each one gets an empty entry in the output map before filling
+	int paperStartIdx; // first line index of this article (inclusive)
+	int paperEndIdx; // line index one past this article's last line (exclusive)
+	unordered_map<string, string>* pumFullTagToTag; // maps a line's tag string to the tag name used as output key
+	vector<string>* pvStrPubmedTxt; // per-line text that is appended to the matching tag's content
+};
+
+// Collects one article: appends each line in [paperStartIdx, paperEndIdx) to the output-map entry of its tag.
+void ThreadProcessArticle(ThreadParam& param) {
+	// Unpack the work item; only *param.pumTagContent is written, the other tables are only read.
+	unordered_map<string, string>& umTagContent = *param.pumTagContent;
+	vector<string>& vLineTag = *param.pvLineTag;
+	vector<string>& vTgName = *param.pvTgName;
+	unordered_map<string, string>& umFullTagToTag = *param.pumFullTagToTag;
+	vector<string>& vStrPubmedTxt = *param.pvStrPubmedTxt;
+
+	int startIdx = param.paperStartIdx;
+	int endIdx = param.paperEndIdx;
+
+	for (int tgIdx = 0; tgIdx < vTgName.size(); ++tgIdx) {
+		umTagContent[vTgName[tgIdx]] = ""; // give every tag name an empty string, so each tag has an entry even if the article lacks it
+	}
+	for (int idx = startIdx; idx < endIdx; ++idx) { // walk every line that belongs to the current article
+		string& fullTag = vLineTag[idx];
+		auto tagItr = umFullTagToTag.find(fullTag);
+		if (tagItr != umFullTagToTag.end()) { // known tag; lines whose tag is not in the table are skipped
+			const string& tag = tagItr->second;
+			string& tagContent = umTagContent[tag];
+			tagContent.append(vStrPubmedTxt[idx]);
+		}
+	}
+}
 
 // å‘½ä»¤è¡Œå‚æ•°ç¤ºä¾‹
-// ProcessPubmedTxt d:\Twirls\gat1\literatures\pubmed_tag.mat D:\Twirls\runtime\negatives\pubmed-multiplesc-set.txt d:\pubmed_txt.mat
+// ProcessPubmedTxt d:\Twirls\gat1\literatures\pubmed_tag.mat D:\Twirls\runtime\negatives\pubmed-multiplesc-set.txt d:\pubmed_txt.mat 12
 /*
  pubmed txtæ–‡ä»¶ä¸­åŒ…å«å¤šä¸ªæ–‡ç« çš„æ‘˜è¦ä¿¡æ¯ï¼Œæ¯ä¸ªä¿¡æ¯æœ€å‰è¾¹æœ‰ä¸€ä¸ªtagï¼Œæ¯ä¸ªtagå¯¹åº”çš„ä¿¡æ¯å¯èƒ½æœ‰ä¸€è¡Œï¼Œä¹Ÿå¯èƒ½å¤šè¡Œï¼Œæ¯ä¸ªæ–‡ç« ä¸­é—´ç”±ä¸€ä¸ªç©ºè¡Œéš”å¼€
  1. è¯»å–é¢„å…ˆæå–çš„pubmed tags, å¹¶å°†tagsä¸­çš„'-'å’Œ' 'å­—ç¬¦åŽ»æŽ‰ï¼Œåªç•™ä¸‹çº¯å­—ç¬¦ä¸²åštag
@@ -81,11 +119,11 @@ bool SavePubmed(const string& matPath,
 void ProcessPubmedTxt(int argc, const char** argv) {
 	// argv 1.pubmed tag.matæ–‡ä»¶; 2.pubmed article.txtæ–‡ä»¶; 3.pubmed out.matè¾“å‡ºæ–‡ä»¶
 	// 
-	if (argc != 4) {
-		cout << "This program should take 3 arguments(1.pubmed tag.mat; 2. pubmed article.txt; 3. pubmed out.mat)!" << endl;
+	if (argc < 4) {
+		cout << "This program should take at least 3 arguments(1.pubmed tag.mat; 2. pubmed article.txt; 3. pubmed out.mat; [4. thread num])!" << endl;
 		return;
 	}
-
+	clock_t begin, finish;
 	int rowNum, colNum;
 	vector<string> vTg;
 	vector<string> vTgName;
@@ -94,6 +132,7 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 	/* è¯»å–pubmed tags */
 	ReadMtxString(argv[1], "tg", vTg, &rowNum, &colNum);
 	/* 1. åŽ»æŽ‰tagsé‡Œçš„'-'å’Œ' 'å­—ç¬¦ï¼Œå¾—åˆ°çº¯å‡€çš„tag */
+	begin = clock();
 	vTgName = vTg;
 	for (int i = 0; i < vTg.size(); ++i) {
 		int pos = 0;
@@ -105,6 +144,8 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 		vTgName[i].resize(pos);
 		umFullTagToTag[vTg[i]] = vTgName[i];
 	}
+	finish = clock();
+	cout << "process tag Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* 2. è¯»å–pubmed txtæ–‡ä»¶ï¼Œå…ˆè¯»å…¥åŽå¤„ç† */
 	ifstream ifsPubmedTxt(argv[2]);
@@ -117,6 +158,7 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 	int curPos = 0;
 	vPaperStartIdx.push_back(curPos); // æ·»åŠ åˆå§‹ç´¢å¼•
 	const int FULL_TAG_LEN = 5;
+	begin = clock();
 	while (getline(ifsPubmedTxt, strLine)) { // è¯»å–å†…å®¹æ—¶å€™åŽ»æŽ‰äº†è¡Œå°¾çš„æ¢è¡Œç¬¦
 		while (strLine.back() == ' ') strLine.pop_back(); // åŽ»æŽ‰è¡Œå°¾çš„ç©ºæ ¼
 		if (strLine.size() == 0) { // æ–°çš„paper
@@ -135,31 +177,27 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 		}
 	}
 	vPaperStartIdx.push_back(curPos); // æ¯”æ–‡ç« å¤š1ï¼Œæœ€åŽä¸€ä¸ªè®°å½•ç»“æŸä½ç½®
+	finish = clock();
+	cout << "read txt Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* å¤„ç†æ¯ä¸€ç¯‡æ–‡ç«  */
-	for (int i = 0; i < vPaperStartIdx.size() - 1; ++i) {
-		int startIdx = vPaperStartIdx[i];
-		int endIdx = vPaperStartIdx[i + 1];
-		unordered_map<string, string> umTagContent;
-
-		for (int tgIdx = 0; tgIdx < vTgName.size(); ++tgIdx) {
-			umTagContent[vTgName[tgIdx]] = ""; // å¯¹æ¯ä¸€ä¸ªtagï¼Œè®¾ç½®ä¸€ä¸ªæ–°çš„string
-		}
-		for (int idx = startIdx; idx < endIdx; ++idx) { // éåŽ†å½“å‰æ–‡ç« çš„æ¯ä¸€ä¸ªtagå†…å®¹
-			string& fullTag = vLineTag[idx];
-			auto tagItr = umFullTagToTag.find(fullTag);
-			if (tagItr != umFullTagToTag.end()) { // æ‰¾åˆ°tagäº†
-				const string& tag = tagItr->second;
-				string& tagContent = umTagContent[tag];
-				tagContent.append(vStrPubmedTxt[idx]);
-			}
-		}
-		vumPaperTagVal.push_back(umTagContent);
+	int numThread = 1;
+	if (argc >= 5) numThread = atoi(argv[4]);
+	if (numThread < 1) numThread = 1;
+	ThreadPool thPool(numThread);
+	vumPaperTagVal.resize(vPaperStartIdx.size()-1);
+	vector<thread> vT;
+	vector<ThreadParam> vTP(vPaperStartIdx.size() - 1);
+	begin = clock();
+	for (int i = 0; i < vTP.size(); ++i) {
+		vTP[i] = { &vumPaperTagVal[i], &vLineTag, &vTgName, vPaperStartIdx[i], vPaperStartIdx[i + 1], &umFullTagToTag, &vStrPubmedTxt };
 	}
-
-	// cout << "æ–‡ä»¶ä¸ªæ•°ï¼š" << vumPaperTagVal.size() << endl;
+	kt_for(numThread, ThreadProcessArticle, vTP);
+	finish = clock();
+	cout << "kt for Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* åŽ»é™¤æ²¡æœ‰æ‘˜è¦çš„æ–‡ç«  */
+	begin = clock();
 	const string abstractTag = "AB";
 	for (auto itr = vumPaperTagVal.begin(); itr != vumPaperTagVal.end(); ) {
 		if ((*itr)[abstractTag].size() == 0) {
@@ -169,8 +207,11 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 			itr++;
 		}
 	}
+	finish = clock();
+	cout << "remove no AB Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* æ ¹æ®PMIDï¼ŒåŽ»é™¤å†—ä½™ */
+	begin = clock();
 	unordered_map<string, int> umPMID;
 	const string pmidTag = "PMID";
 	for (auto itr = vumPaperTagVal.begin(); itr != vumPaperTagVal.end(); ) {
@@ -183,16 +224,25 @@ void ProcessPubmedTxt(int argc, const char** argv) {
 			itr++;
 		}
 	}
+	finish = clock();
+	cout << "remove duplication Total time : " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
 	/* å°†titleå’Œabstractåˆå¹¶ï¼Œèµ‹å€¼ç»™abstract */
+	begin = clock();
 	const string titleTag = "TI";
 	for (auto itr = vumPaperTagVal.begin(); itr != vumPaperTagVal.end(); itr++) {
 		string& abstractStr = (*itr)[abstractTag];
 		abstractStr = (*itr)[titleTag] + " " + abstractStr; // å¯èƒ½ä¼šæœ‰æ€§èƒ½æŸå¤±ï¼Œä¸è¿‡å½±å“ä¸å¤§
 	}
+	finish = clock();
+	cout << "merge abs and title Total time : " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 
+	// å…³é—­txtæ–‡ä»¶
 	ifsPubmedTxt.close();
 
 	/* å°†å¤„ç†åŽçš„æ•°æ®å†™å…¥matæ–‡ä»¶ï¼Œmatä¸­çš„å˜é‡åç§°åˆ†åˆ«ä¸ºTxå’Œabs1 */
+	begin = clock();
 	SavePubmed(argv[3], vTgName, vumPaperTagVal);
+	finish = clock();
+	cout << "write to MAT Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 }
\ No newline at end of file
diff --git a/GMM/main.cpp b/GMM/main.cpp
index 4f254cf..cd93d62 100644
--- a/GMM/main.cpp
+++ b/GMM/main.cpp
@@ -30,8 +30,9 @@
 #endif
 #include <mat.h>
 #include "gmm.h"
-#include "CommonLib/thread_pool.h"
+// #include "CommonLib/thread_pool.h"
 #include "CommonLib/matlab_io.h"
+#include "CommonLib/kthread.h"
 using namespace std;
 using std::cout;
 using std::vector;
@@ -144,7 +145,9 @@ struct ThreadParam {
 	fs::path matFilePath;
 	fs::path outFilePath;
 };
-void ThreadProcessData(const ThreadParam& param) {
+//void ThreadProcessData(vector<ThreadParam>& vTP, long idx, int tid) {
+void ThreadProcessData(ThreadParam& param) {
+	//const ThreadParam& param = vTP[idx];
 	const fs::path& matFilePath = param.matFilePath;
 	const fs::path& outFilePath = param.outFilePath;
 	double* hs = nullptr;
@@ -192,10 +195,10 @@ int main(int argc, const char** argv) {
 	int numThread = 1;
 	if (argc >= 4) numThread = atoi(argv[4]);
 	if (numThread < 1) numThread = 1;
-	ThreadPool thPool(numThread);
+	//ThreadPool thPool(numThread);
 	clock_t begin, finish;
 	begin = clock();
-
+	vector<ThreadParam> vTP;
 	/* ±éÀúËùÓÐµÄÖªÊ¶¿ÅÁ£Ä¿Â¼£¬ÖðÒ»½øÐÐ´¦Àí */
 	for (auto& childDir : fs::directory_iterator(parrentDir)) {
 		fs::path outFilePath = childDir / outFileName;
@@ -203,12 +206,14 @@ int main(int argc, const char** argv) {
 			const string& fileName = file.path().filename().string();
 			auto rPos = fileName.rfind(hsMatSuffix);
 			if (rPos != string::npos && fileName.size() - rPos == hsMatSuffix.size()) {
-				ThreadParam tParam = { file, outFilePath };
-				thPool.enqueue(ThreadProcessData, tParam);
+				//ThreadParam tParam = { file, outFilePath };
+				//thPool.enqueue(ThreadProcessData, tParam);
+				vTP.push_back({ file, outFilePath });
 			}
 		}
 	}
-	thPool.~ThreadPool();
+	kt_for(numThread, ThreadProcessData, vTP);
+	//thPool.~ThreadPool();
 	finish = clock();
 	cout << "GMM Total time: " << (double)(finish - begin) / CLOCKS_PER_SEC << " s" << endl;
 	return 0;