{"id":"https://openalex.org/W4416256122","doi":"https://doi.org/10.48550/arxiv.2509.19834","title":"TianHui: A Domain-Specific Large Language Model for Diverse Traditional Chinese Medicine Scenarios","display_name":"TianHui: A Domain-Specific Large Language Model for Diverse Traditional Chinese Medicine Scenarios","publication_year":2025,"publication_date":"2025-09-24","ids":{"openalex":"https://openalex.org/W4416256122","doi":"https://doi.org/10.48550/arxiv.2509.19834"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2509.19834","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19834","pdf_url":"https://arxiv.org/pdf/2509.19834","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.19834","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102068680","display_name":"Yin Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yin, Ji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005891103","display_name":"Menglan He","orcid":"https://orcid.org/0000-0002-7270-9583"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Menglan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101566112","display_name":"Yujie Zhang","orcid":"https://orcid.org/0000-0003-1805-8342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yujie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101688256","display_name":"Linshuai Zhang","orcid":"https://orcid.org/0000-0002-8877-0936"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Linshuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101812242","display_name":"Tingting Ma","orcid":"https://orcid.org/0000-0002-8488-651X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Tingting","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051956004","display_name":"Chuanshan Tian","orcid":"https://orcid.org/0000-0003-3341-1378"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Ce","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100600528","display_name":"Jie Wu","orcid":"https://orcid.org/0000-0002-3472-1717"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112987496","display_name":"Lin Xu","orcid":"https://orcid.org/0000-0002-4023-4106"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Lin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Jiang, Tao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Tao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5102068680"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12647","display_name":"Traditional Chinese Medicine Studies","score":0.5823000073432922,"subfield":{"id":"https://openalex.org/subfields/2707","display_name":"Complementary and alternative medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T12647","display_name":"Traditional Chinese Medicine Studies","score":0.5823000073432922,"subfield":{"id":"https://openalex.org/subfields/2707","display_name":"Complementary and alternative medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.07989999651908875,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.03420000150799751,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5246999859809875},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5239999890327454},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5012999773025513},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4672999978065491},{"id":"https://openalex.org/keywords/traditional-chinese-medicine","display_name":"Traditional Chinese medicine","score":0.39969998598098755},{"id":"https://openalex.org/keywords/chinese-language","display_name":"Chinese language","score":0.36559998989105225},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.35019999742507935},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.30550000071525574}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7207000255584717},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5882999897003174},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5239999890327454},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5012999773025513},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49779999256134033},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4684999883174896},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4672999978065491},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.42750000953674316},{"id":"https://openalex.org/C188947578","wikidata":"https://www.wikidata.org/wiki/Q200253","display_name":"Traditional Chinese medicine","level":3,"score":0.39969998598098755},{"id":"https://openalex.org/C3018428822","wikidata":"https://www.wikidata.org/wiki/Q7850","display_name":"Chinese language","level":2,"score":0.36559998989105225},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.35019999742507935},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.30550000071525574},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2976999878883362},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.29580000042915344},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C105002631","wikidata":"https://www.wikidata.org/wiki/Q4833645","display_name":"Subject-matter expert","level":3,"score":0.26579999923706055},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2624000012874603},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25999999046325684},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.2567000091075897},{"id":"https://openalex.org/C2777220311","wikidata":"https://www.wikidata.org/wiki/Q6423340","display_name":"Knowledge acquisition","level":2,"score":0.25049999356269836}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2509.19834","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19834","pdf_url":"https://arxiv.org/pdf/2509.19834","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.19834","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.19834","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.19834","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19834","pdf_url":"https://arxiv.org/pdf/2509.19834","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Domain-specific":[0],"LLMs":[1],"in":[2,6,73,89],"TCM":[3,26,41,119],"face":[4],"limitations":[5],"research":[7],"settings":[8],"due":[9],"to":[10],"constrained":[11],"adaptability,":[12],"insufficient":[13],"evaluation":[14],"datasets,":[15],"and":[16,33,50,61,85,115],"limited":[17],"computational":[18],"resources.":[19],"This":[20],"study":[21],"presents":[22],"TianHui,":[23],"a":[24,39,52],"specialized":[25],"LLM":[27],"built":[28],"through":[29],"contextual":[30],"data":[31,45],"integration":[32],"domain":[34],"knowledge":[35],"fusion.":[36],"We":[37],"constructed":[38],"large-scale":[40],"corpus":[42],"(0.97GB":[43],"unsupervised":[44],"+":[46],"611,312":[47],"QA":[48],"pairs)":[49],"employed":[51],"two-stage":[53],"training":[54],"strategy":[55],"with":[56],"QLoRA,":[57],"DeepSpeed":[58],"Stage":[59],"2,":[60],"Flash":[62],"Attention":[63],"2.":[64],"Evaluation":[65],"on":[66],"12":[67],"benchmarks":[68],"showed":[69],"TianHui":[70,111],"ranked":[71],"top-three":[72],"all":[74],"metrics":[75],"for":[76],"six":[77,92],"datasets":[78],"(APQ,":[79],"TCMCD,":[80],"HFR,":[81],"HCCA,":[82],"DHPE,":[83],"TLAW)":[84],"achieved":[86],"top":[87],"results":[88],"the":[90],"other":[91],"(TCMEE,":[93],"APR,":[94],"GCPMI,":[95],"TCMKQA,":[96],"TCMRC,":[97],"ADTG).":[98],"Optimal":[99],"configuration":[100],"was":[101],"identified":[102],"as":[103],"LoRA":[104],"rank=128,":[105],"alpha=256,":[106],"epoch=4,":[107],"dropout=0.2,":[108],"max":[109],"length=2048.":[110],"enables":[112],"systematic":[113],"preservation":[114],"scalable":[116],"application":[117],"of":[118],"knowledge.":[120],"All":[121],"resources":[122],"are":[123],"open-sourced.":[124]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2025-10-10T00:00:00"}
