{"id":"https://openalex.org/W4306976400","doi":"https://doi.org/10.1186/s13321-022-00650-3","title":"A fingerprints based molecular property prediction method using the BERT model","display_name":"A fingerprints based molecular property prediction method using the BERT model","publication_year":2022,"publication_date":"2022-10-21","ids":{"openalex":"https://openalex.org/W4306976400","doi":"https://doi.org/10.1186/s13321-022-00650-3","pmid":"https://pubmed.ncbi.nlm.nih.gov/36271394"},"language":"en","primary_location":{"id":"doi:10.1186/s13321-022-00650-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-022-00650-3","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-022-00650-3","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-022-00650-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091740913","display_name":"Naifeng Wen","orcid":"https://orcid.org/0000-0003-2725-8645"},"institutions":[{"id":"https://openalex.org/I61565387","display_name":"Dalian Minzu University","ror":"https://ror.org/02hxfx521","country_code":"CN","type":"education","lineage":["https://openalex.org/I61565387"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Naifeng Wen","raw_affiliation_strings":["School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China","institution_ids":["https://openalex.org/I61565387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070822882","display_name":"Guanqun Liu","orcid":"https://orcid.org/0000-0003-2520-7625"},"institutions":[{"id":"https://openalex.org/I61565387","display_name":"Dalian Minzu University","ror":"https://ror.org/02hxfx521","country_code":"CN","type":"education","lineage":["https://openalex.org/I61565387"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanqun Liu","raw_affiliation_strings":["School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China","institution_ids":["https://openalex.org/I61565387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100436650","display_name":"Jie Zhang","orcid":"https://orcid.org/0000-0001-8264-5950"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Zhang","raw_affiliation_strings":["Beijing Huawei Digital Technologies Co., Ltd, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Huawei Digital Technologies Co., Ltd, Beijing, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101735545","display_name":"Rubo Zhang","orcid":"https://orcid.org/0000-0002-3211-6273"},"institutions":[{"id":"https://openalex.org/I61565387","display_name":"Dalian Minzu University","ror":"https://ror.org/02hxfx521","country_code":"CN","type":"education","lineage":["https://openalex.org/I61565387"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rubo Zhang","raw_affiliation_strings":["School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China. zhangrubo@dlnu.edu.cn","School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China. zhangrubo@dlnu.edu.cn","institution_ids":[]},{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China","institution_ids":["https://openalex.org/I61565387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089658787","display_name":"Yating Fu","orcid":"https://orcid.org/0009-0004-7509-6518"},"institutions":[{"id":"https://openalex.org/I61565387","display_name":"Dalian Minzu University","ror":"https://ror.org/02hxfx521","country_code":"CN","type":"education","lineage":["https://openalex.org/I61565387"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yating Fu","raw_affiliation_strings":["School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China","institution_ids":["https://openalex.org/I61565387"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007086045","display_name":"Xu Han","orcid":"https://orcid.org/0000-0003-4417-9340"},"institutions":[{"id":"https://openalex.org/I61565387","display_name":"Dalian Minzu University","ror":"https://ror.org/02hxfx521","country_code":"CN","type":"education","lineage":["https://openalex.org/I61565387"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Han","raw_affiliation_strings":["School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical and Electronic Engineering, Dalian Minzu University, Dalian, China","institution_ids":["https://openalex.org/I61565387"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5091740913"],"corresponding_institution_ids":["https://openalex.org/I61565387"],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":10.6658,"has_fulltext":true,"cited_by_count":73,"citation_normalized_percentile":{"value":0.98820694,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"14","issue":"1","first_page":"71","last_page":"71"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.838703989982605},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6809351444244385},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6392298936843872},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.6363363265991211},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6113982796669006},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6023259162902832},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5681051015853882},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4666825234889984},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.44418638944625854},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4432596266269684},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.44184941053390503},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.44125092029571533},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.44043588638305664},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4174797534942627},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41028547286987305},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07441669702529907}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.838703989982605},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6809351444244385},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6392298936843872},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.6363363265991211},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6113982796669006},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6023259162902832},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5681051015853882},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4666825234889984},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.44418638944625854},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4432596266269684},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.44184941053390503},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.44125092029571533},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.44043588638305664},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4174797534942627},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41028547286987305},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07441669702529907},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1186/s13321-022-00650-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-022-00650-3","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-022-00650-3","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmid:36271394","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36271394","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of cheminformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:00d73938472b4809924a25932179a43f","is_oa":true,"landing_page_url":"https://doaj.org/article/00d73938472b4809924a25932179a43f","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Cheminformatics, Vol 14, Iss 1, Pp 1-13 (2022)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:9585730","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9585730","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Cheminform","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13321-022-00650-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-022-00650-3","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-022-00650-3","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3414326597","display_name":null,"funder_award_id":"61673084","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8774092211","display_name":null,"funder_award_id":"MD-IPAC-2019103","funder_id":"https://openalex.org/F4320336732","funder_display_name":"Key Laboratory of Intelligent Perception and Advanced Control of State Ethnic Affairs Commission"},{"id":"https://openalex.org/G8942021038","display_name":null,"funder_award_id":"2020-MS-135","funder_id":"https://openalex.org/F4320323086","funder_display_name":"Natural Science Foundation of Liaoning Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323086","display_name":"Natural Science Foundation of Liaoning Province","ror":null},{"id":"https://openalex.org/F4320330200","display_name":"National Ethnic Affairs Commission of the People's Republic of China","ror":"https://ror.org/01p9g6b97"},{"id":"https://openalex.org/F4320336732","display_name":"Key Laboratory of Intelligent Perception and Advanced Control of State Ethnic Affairs Commission","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4306976400.pdf","grobid_xml":"https://content.openalex.org/works/W4306976400.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W1988037271","https://openalex.org/W1999798000","https://openalex.org/W2008505552","https://openalex.org/W2048080607","https://openalex.org/W2060531713","https://openalex.org/W2076498053","https://openalex.org/W2134164499","https://openalex.org/W2406943157","https://openalex.org/W2594183968","https://openalex.org/W2751756351","https://openalex.org/W2777416523","https://openalex.org/W2943890584","https://openalex.org/W2962876364","https://openalex.org/W2966357564","https://openalex.org/W2969457089","https://openalex.org/W2973114758","https://openalex.org/W2986232138","https://openalex.org/W3037888463","https://openalex.org/W3109892317","https://openalex.org/W3191637674","https://openalex.org/W4221074165","https://openalex.org/W4221160432","https://openalex.org/W4224220091","https://openalex.org/W4226159083","https://openalex.org/W4290930066","https://openalex.org/W6600451497"],"related_works":["https://openalex.org/W2081900870","https://openalex.org/W4390516098","https://openalex.org/W2037549926","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2345479200","https://openalex.org/W2183306018","https://openalex.org/W2142795561","https://openalex.org/W2849310602","https://openalex.org/W4205302943"],"abstract_inverted_index":{"Molecular":[0],"property":[1],"prediction":[2,34,119],"(MPP)":[3],"is":[4,74],"vital":[5],"in":[6,61],"drug":[7,10],"discovery":[8],"and":[9,33,87,127],"reposition.":[11],"Deep":[12],"learning-based":[13],"MPP":[14,38,106],"models":[15],"capture":[16],"molecular":[17,69],"property-related":[18],"features":[19],"from":[20,46],"various":[21],"molecule":[22,30,93],"representations.":[23],"In":[24],"this":[25],"paper,":[26],"we":[27],"propose":[28],"a":[29,42,62],"sequence":[31],"embedding":[32],"model":[35,116],"facing":[36],"with":[37,109],"task.":[39],"We":[40],"pre-trained":[41],"bi-directional":[43],"encoder":[44,49],"representations":[45],"Transformers":[47],"(BERT)":[48],"to":[50,76,82],"obtain":[51],"the":[52,67,72,77,88,92,110,114,124],"semantic":[53],"representation":[54,70],"of":[55,91,123],"compound":[56],"fingerprints,":[57],"called":[58],"Fingerprints-BERT":[59],"(FP-BERT),":[60],"self-supervised":[63],"learning":[64],"manner.":[65],"Then,":[66],"encoded":[68],"by":[71],"FP-BERT":[73],"input":[75],"convolutional":[78],"neural":[79],"network":[80],"(CNN)":[81],"extract":[83],"higher-level":[84],"abstract":[85],"features,":[86],"predicted":[89],"properties":[90],"are":[94],"finally":[95],"obtained":[96],"through":[97],"fully":[98],"connected":[99],"layer":[100],"for":[101],"distinct":[102],"classification":[103,125],"or":[104],"regression":[105,128],"tasks.":[107,129],"Comparison":[108],"baselines":[111],"shows":[112],"that":[113],"proposed":[115],"achieves":[117],"high":[118],"performance":[120],"on":[121],"all":[122],"tasks":[126]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":31},{"year":2023,"cited_by_count":10}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
