• 利用化合物名称通过 PubChemPy 从 PubChem 批量下载化合物信息


    # -*- coding: utf-8 -*-
    """
    Look up one compound name on PubChem and print its basic properties.

    Created on Tue Nov  8 13:07:40 2022

    @author: Administrator
    """

    from pubchempy import get_compounds, Compound

    QUERY_NAME = '2-(1H-indol-3-yl)acetic acid'

    # get_compounds returns a list; it is empty when the name matches nothing.
    matches = get_compounds(QUERY_NAME, 'name')

    if matches:
        # Report the last match, which is what the earlier loop-then-print
        # layout effectively did.
        compound = matches[-1]
        print(compound.cid)
        print(compound.molecular_weight)
        print(compound.molecular_formula)
        print(compound.isomeric_smiles)
        print(compound.iupac_name)
    else:
        # Without this guard an empty result ended in a NameError on `compound`.
        print('No PubChem record found for: ' + QUERY_NAME)
    
    
    • 1
    • 2
    • 3
    • 4
    • 5
    • 6
    • 7
    • 8
    • 9
    • 10
    • 11
    • 12
    • 13
    • 14
    • 15
    • 16
    • 17
    • 18
    • 19
    • 20
    • 21
    • 22
    • 23
    # -*- coding: utf-8 -*-
    """
    Read metabolite names from an Excel sheet and print PubChem properties
    for each of them.

    Created on Tue Nov  8 13:30:10 2022

    @author: Administrator
    """

    from pubchempy import get_compounds, Compound

    import pandas as pd

    a = pd.read_excel("G:\\非靶向代谢组数据库\\wheat\\wheat2.xlsx")
    a = a['Metabolites']

    for name in a:
        matches = get_compounds(name, 'name')
        if not matches:
            # Previously an unmatched name printed the properties of the
            # preceding metabolite (or raised NameError on the first row).
            print('No PubChem record found for: ' + str(name))
            continue

        # Keep the last match, as the original inner loop did.
        compound = matches[-1]
        print(compound.cid)
        print(compound.molecular_weight)
        print(compound.molecular_formula)
        print(compound.isomeric_smiles)
        print(compound.iupac_name)
    
        
    
    • 1
    • 2
    • 3
    • 4
    • 5
    • 6
    • 7
    • 8
    • 9
    • 10
    • 11
    • 12
    • 13
    • 14
    • 15
    • 16
    • 17
    • 18
    • 19
    • 20
    • 21
    • 22
    • 23
    • 24
    • 25
    • 26
    # -*- coding: utf-8 -*-
    """
    Read metabolite names from an Excel sheet, query PubChem for each one and
    collect the results into a DataFrame named ``information``.

    The result has one row per input name, in input order. Names without a
    PubChem match get a row of missing values so rows stay aligned with the
    input column.

    Created on Tue Nov  8 13:30:10 2022

    @author: Administrator
    """

    from pubchempy import get_compounds, Compound

    import pandas as pd

    a = pd.read_excel("G:\\非靶向代谢组数据库\\wheat\\wheat2.xlsx")
    a = a['Metabolites']

    COLUMNS = ['PubChem_CID', 'isomeric_smiles', 'molecular_formula',
               'molecular_weight', 'iupac_name']

    rows = []
    # Iterate over whatever the sheet contains instead of a hard-coded 704 rows.
    for i, name in enumerate(a):
        matches = get_compounds(name, 'name')
        if matches:
            # Keep the last match, as the original inner loop did.
            compound = matches[-1]
            row = (compound.cid,
                   compound.isomeric_smiles,
                   compound.molecular_formula,
                   compound.molecular_weight,
                   compound.iupac_name)
            print(compound.cid)
            print(compound.molecular_weight)
            print(compound.molecular_formula)
            print(compound.isomeric_smiles)
            print(compound.iupac_name)
        else:
            # Do not silently reuse the previous metabolite's values.
            row = (None, None, None, None, None)
            print('No PubChem record found for: ' + str(name))
        print(i)  # progress indicator
        rows.append(row)

    # Passing the five lists positionally would have been read as
    # (data, index, columns, dtype, copy); build named columns instead.
    information = pd.DataFrame(rows, columns=COLUMNS)
    
    
    • 1
    • 2
    • 3
    • 4
    • 5
    • 6
    • 7
    • 8
    • 9
    • 10
    • 11
    • 12
    • 13
    • 14
    • 15
    • 16
    • 17
    • 18
    • 19
    • 20
    • 21
    • 22
    • 23
    • 24
    • 25
    • 26
    • 27
    • 28
    • 29
    • 30
    • 31
    • 32
    • 33
    • 34
    • 35
    • 36
    • 37
    • 38
    # -*- coding: utf-8 -*-
    """
    Read metabolite names from an Excel sheet, query PubChem for each one from
    row START_ROW onward, and export the collected properties to Excel.

    The output has one row per processed name, in input order. Names without a
    PubChem match get a row of missing values so rows stay aligned with the
    input column.

    Created on Tue Nov  8 13:30:10 2022 (revised Tue Nov  8 15:48:20 2022)

    @author: Administrator
    """

    from pubchempy import get_compounds, Compound

    import pandas as pd
    import numpy as np

    # First row (0-based) to process; rows before it are skipped.
    START_ROW = 110

    a = pd.read_excel("G:\\非靶向代谢组数据库\\wheat\\wheat2.xlsx")
    a = a['Metabolites']

    COLUMNS = ['PubChem_CID', 'molecular_weight', 'molecular_formula',
               'isomeric_smiles', 'iupac_name']

    rows = []
    # Run to the end of the sheet instead of a hard-coded upper bound of 704.
    for i, name in enumerate(a.iloc[START_ROW:], start=START_ROW):
        matches = get_compounds(name, 'name')
        if matches:
            # Keep the last match, as the original inner loop did.
            compound = matches[-1]
            # Tuple order follows COLUMNS; the earlier version stored SMILES
            # under 'molecular_weight' and the weight under 'isomeric_smiles'.
            row = (compound.cid,
                   compound.molecular_weight,
                   compound.molecular_formula,
                   compound.isomeric_smiles,
                   compound.iupac_name)
            print(compound.cid)
            print(compound.molecular_weight)
            print(compound.molecular_formula)
            print(compound.isomeric_smiles)
            print(compound.iupac_name)
        else:
            # Do not silently reuse the previous metabolite's values.
            row = (None, None, None, None, None)
            print('No PubChem record found for: ' + str(name))
        print(i)  # progress indicator
        rows.append(row)

    information = pd.DataFrame(rows, columns=COLUMNS)
    information.to_excel('e:/count/example2.xlsx')
    
    
    • 1
    • 2
    • 3
    • 4
    • 5
    • 6
    • 7
    • 8
    • 9
    • 10
    • 11
    • 12
    • 13
    • 14
    • 15
    • 16
    • 17
    • 18
    • 19
    • 20
    • 21
    • 22
    • 23
    • 24
    • 25
    • 26
    • 27
    • 28
    • 29
    • 30
    • 31
    • 32
    • 33
    • 34
    • 35
    • 36
    • 37
    • 38
    • 39
    • 40
    • 41
    • 42
    • 43
    • 44
    • 45
    • 46
    • 47
    • 48
    • 49
    • 50
    • 51
    • 52
  • 相关阅读:
    MySQL夺命66问,面试必看!(荣耀典藏版)
    AP5186 三功能 LED 降压型恒流芯片 手电筒 LED芯片
    Linux 常用操作
    SCS【1】今天开启单细胞之旅,述说单细胞测序的前世今生
    了解如何利用来自 ADAudit Plus 的基本用户登录报告:登录失败
    STM32 LwIP学习过程问题总结(一):LwIP ping不通,抓包发现ICMP校验和为0x0000
    LeetCode221112_124、844.比较含退格的字符串
    《大数据分析技术》教学上机实验报告
    文献阅读(207)FPGA HBM
    Jenkins使用pipeline部署服务到远程服务器
  • 原文地址:https://blog.csdn.net/weixin_47634487/article/details/127752300