| 54 |
Create table pubchem.nci_h23 (
"sid" Integer,
"ext_datasource_regid" Integer,
"cid" Integer,
"activity_outcome" Integer,
"activity_score" Integer,
"activity_url" Text,
"assaydata_comment" Text,
"assaydata_revoke" Text,
"log_gi50_M" Numeric,
"log_gi50_ugml" Numeric,
"log_gi50_v" Numeric,
"indngi50" Integer,
"stddevgi50" Numeric,
"logtgi_m" Numeric,
"logtgi_ugml" Numeric,
"logtgi_v" Numeric,
"indntgi" Integer,
"stddevtgi" Numeric
);
Comment on table pubchem.nci_h23 is
'Growth inhibition of the NCI_H23 human Non-Small Cell Lung tumor cell line is measured as a screen
for anti-cancer activity. Cells are grown in 96 well plates and exposed to the test compound for 48 hours.
Compounds are tested at 5 different concentrations and three endpoints are estimated from this
dose response curve: GI50, concentration required for 50% inhibition of growth, TGI,
the concentration requires for complete inhibition of growth, and LC50, the concentration
required for 50% reduction in cell number. These estimates are done by simple linear interpolation
between the concentrations that surround the appropriate level.
If a compound doesn’’t cause inhibition to the appropriate level, the endpoint is set to the highest
concentration tested.';
Comment on column pubchem.nci_h23."sid" is 'PubChem Substance ID SID';
Comment on column pubchem.nci_h23."ext_datasource_regid" is
'Space holder for PubChem external datasource RegID, empty by default';
Comment on column pubchem.nci_h23."cid" is 'Pubchem Compound ID'; |
| 56 |
Select sid, activity_outcome, "log_gi50_M", log_gi50_ugml
from nci_h23 where activity_outcome = 2;
Create Table substance (
Title text,
BONDANNOTATIONS text,
CID_ASSOCIATIONS text,
COMPOUND_ID_TYPE integer,
EXT_DATASOURCE_NAME text,
EXT_DATASOURCE_REGID text,
EXT_DATASOURCE_URL text,
EXT_SUBSTANCE_URL text,
GENBANK_NUCLEOTIDE_ID text,
GENBANK_PROTEIN_ID text,
GENERIC_REGISTRY_NAME text,
PUBMED_ID text,
SUBSTANCE_COMMENT text,
SUBSTANCE_ID integer,
SUBSTANCE_SYNONYM text,
SUBSTANCE_VERSION integer,
TOTAL_CHARGE integer,
XREF_EXT_ID text);
Copy substance (
Title,
BONDANNOTATIONS,
CID_ASSOCIATIONS,
COMPOUND_ID_TYPE,
EXT_DATASOURCE_NAME,
EXT_DATASOURCE_REGID,
EXT_DATASOURCE_URL,
EXT_SUBSTANCE_URL,
GENBANK_NUCLEOTIDE_ID,
GENBANK_PROTEIN_ID,
GENERIC_REGISTRY_NAME,
PUBMED_ID,
SUBSTANCE_COMMENT,
SUBSTANCE_ID,
SUBSTANCE_SYNONYM,
SUBSTANCE_VERSION,
TOTAL_CHARGE,
XREF_EXT_ID)
from stdin delimiter ',';
1,\N,449635 1,0,MOLI,MOLI000002,\N,\N,\N,\N,\N,\N,MOLI - NCI Molecular Imaging Agents\nFGCV,1,MOLI000002,1,0,MOLI000002
2,2 11 5\n20 34 5\n25 31 6\n28 55 5\n5 13 6\n58 59 6\n8 33 5,\N,0,MOLI,MOLI000003,\N,\N,\N,\N,\N,\N,MOLI - NCI Molecular Imaging Agents\n[99mTc]-P2S2-BBN(7-14),2,MOLI000003,1,0,MOLI000003 |
| 64 |
Select id,smiles,mw From atable Where mw < 500;
Select id,smiles,mw,logp From atable Where
(logp > 0 And mw < 500) Or
(logp < 0 And mw < 580);
Select
n.sid, n.activity_outcome, n."log_gi50_M", n.log_gi50_ugml
From
nci_h23 n
Where activity_outcome = 2
Order By sid;
Select
n.sid, n.activity_outcome, n."log_gi50_M", n.log_gi50_ugml,
s.ext_datasource_name, s.ext_datasource_regid
From
nci_h23 n
Join substance s On s.substance_id = n.sid
Where activity_outcome = 2
Order By sid; |
| 65 |
Select
n.sid, n.activity_outcome, n."log_gi50_M", n.log_gi50_ugml,
s.ext_datasource_name, s.ext_datasource_regid,
sc.compound_id, sc.compound_type
From
nci_h23 n
Join substance s On s.substance_id = n.sid
Join substance_compound sc On sc.substance_id = s.substance_id
Where activity_outcome = 2
Order By sid;
Select
n.sid, n.activity_outcome, n."log_gi50_M", n.log_gi50_ugml,
s.ext_datasource_name, s.ext_datasource_regid,
sc.compound_id, sc.compound_type,
c.openeye_can_smiles
From
nci_h23 n
Join substance s On s.substance_id = n.sid
Join substance_compound sc On sc.substance_id = s.substance_id
Join compound c On c.cid = sc.compound_id
Where activity_outcome = 2
Order By sid; |