Skip to content
This repository was archived by the owner on Jun 18, 2022. It is now read-only.

Commit 456c9fb

Browse files
author
Dmitriy "DK" Korobskiy
committed
Merge remote-tracking branch 'origin/master'
2 parents 4b81431 + 774fd10 commit 456c9fb

1 file changed

Lines changed: 21 additions & 22 deletions

File tree

Analysis/affymetrix/garfield_import_dmet_twog.sql

Lines changed: 21 additions & 22 deletions
Original file line number | Diff line number | Diff line change
@@ -59,15 +59,16 @@ FROM garfield_dmet_begin a INNER JOIN wos_references b ON a.target=b.source_id;
5959
-- Inner join on wos_publications to keep only viable references (those with complete WoS IDs)
6060
DROP TABLE IF EXISTS garfield_dmet_twog;
6161
CREATE TABLE garfield_dmet_twog AS
62-
SELECT a.* FROM garfield_dmet_twog_a INNER JOIN
63-
wos_publications_b ON a.target=b.source_id;
62+
SELECT a.* FROM garfield_dmet_twog_a a INNER JOIN
63+
wos_publications b ON a.target=b.source_id;
6464

6565
-- begin node list assembly process.
6666
-- Recreate the staging table that collects node rows before the node list
-- is built. Each insert further down fills node_id and node_name plus
-- exactly one of stype / ttype; the other type column stays NULL.
DROP TABLE IF EXISTS garfield_node_assembly;

CREATE TABLE garfield_node_assembly (
    node_id   varchar(16),
    node_name varchar(19),
    stype     varchar(10),
    ttype     varchar(10)
);
6969

7070
--build node_table
71+
-- insert from end point
7172
--gen1
7273
INSERT INTO garfield_node_assembly(node_id,node_name,stype)
7374
SELECT DISTINCT 'n'||substring(source,5),source,stype
@@ -86,14 +87,24 @@ INSERT INTO garfield_node_assembly(node_id,node_name,ttype)
8687
SELECT DISTINCT 'n'||substring(target,5),target,ttype
8788
FROM garfield_gen2;
8889

89-
--garfield_dmet_begin
90+
-- insert from start point (dmet plus)
91+
-- garfield_dmet_begin
9092
-- Source-side nodes of garfield_dmet_begin.
-- node_id is the literal 'n' followed by the source value from its 5th
-- character onward; node_name keeps the full source value.
INSERT INTO garfield_node_assembly (node_id, node_name, stype)
SELECT DISTINCT
    'n' || substring(b.source, 5) AS node_id,
    b.source                      AS node_name,
    b.stype
FROM garfield_dmet_begin AS b;
9395

9496
-- Target-side nodes of garfield_dmet_begin.
-- node_id is the literal 'n' followed by the target value from its 5th
-- character onward; node_name keeps the full target value.
INSERT INTO garfield_node_assembly (node_id, node_name, ttype)
SELECT DISTINCT
    'n' || substring(b.target, 5) AS node_id,
    b.target                      AS node_name,
    b.ttype
FROM garfield_dmet_begin AS b;
99+
100+
-- gen1_cited
101+
-- Source-side nodes of garfield_dmet_twog.
-- node_id is the literal 'n' followed by the source value from its 5th
-- character onward; node_name keeps the full source value.
-- The source type goes into the stype column, matching the other
-- source-side inserts in this script. The previous column list named ttype,
-- which stored source types in the target-type column.
INSERT INTO garfield_node_assembly (node_id, node_name, stype)
SELECT DISTINCT
    'n' || substring(source, 5),
    source,
    stype
FROM garfield_dmet_twog;
104+
105+
-- Target-side nodes of garfield_dmet_twog.
-- node_id is the literal 'n' followed by the target value from its 5th
-- character onward; node_name keeps the full target value.
INSERT INTO garfield_node_assembly (node_id, node_name, ttype)
SELECT DISTINCT
    'n' || substring(t.target, 5) AS node_id,
    t.target                      AS node_name,
    t.ttype
FROM garfield_dmet_twog AS t;
97108
-- Index the assembled node rows by node_id.
CREATE INDEX garfield_node_assembly_idx
    ON garfield_node_assembly (node_id);
98109

99110
DROP TABLE IF EXISTS garfield_nodelist;
@@ -116,6 +127,10 @@ FROM garfield_gen2;
116127
-- Append the garfield_dmet_begin edges to garfield_edge_table.
-- No column list is given, so the six selected values are assigned to the
-- table's columns by position. snid / tnid are the literal 'n' followed by
-- the source / target value from its 5th character onward.
INSERT INTO garfield_edge_table
SELECT
    'n' || substring(e.source, 5) AS snid,
    'n' || substring(e.target, 5) AS tnid,
    e.source,
    e.target,
    e.stype,
    e.ttype
FROM garfield_dmet_begin AS e;
130+
131+
-- Append the garfield_dmet_twog edges to garfield_edge_table.
-- No column list is given, so the six selected values are assigned to the
-- table's columns by position. snid / tnid are the literal 'n' followed by
-- the source / target value from its 5th character onward.
INSERT INTO garfield_edge_table
SELECT
    'n' || substring(e.source, 5) AS snid,
    'n' || substring(e.target, 5) AS tnid,
    e.source,
    e.target,
    e.stype,
    e.ttype
FROM garfield_dmet_twog AS e;
119134
-- Composite index on the edge endpoints (source node id, then target node id).
CREATE INDEX garfield_edge_table_idx
    ON garfield_edge_table (snid, tnid);
120135

121136
DROP TABLE IF EXISTS garfield_edgelist;
@@ -143,23 +158,6 @@ CREATE TABLE garfield_nodelist_formatted_b_pmid AS
143158
SELECT a.*,b.pmid_int FROM garfield_nodelist_formatted_b a
144159
LEFT JOIN wos_pmid_mapping b ON a.node_name=b.wos_id;
145160

146-
/*
147-
DROP TABLE IF EXISTS garfield_nodelist_formatted_b_pmid_grants;
148-
CREATE TABLE garfield_nodelist_formatted_b_pmid_grants AS
149-
SELECT a.*,b.project_number FROM garfield_nodelist_formatted_b_pmid a
150-
LEFT JOIN exporter_publink b ON a.pmid_int=b.pmid::int;
151-
152-
ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN ic varchar(2);
153-
ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN nida varchar(10);
154-
ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN other_nih varchar(10);
155-
156-
UPDATE garfield_nodelist_formatted_b_pmid_grants SET ic=substring(project_number,4,2);
157-
UPDATE garfield_nodelist_formatted_b_pmid_grants SET nida='1' WHERE ic='DA';
158-
UPDATE garfield_nodelist_formatted_b_pmid_grants SET nida='0' WHERE nida IS NULL;
159-
UPDATE garfield_nodelist_formatted_b_pmid_grants SET other_nih='1' WHERE ic IS NOT NULL AND nida='0';
160-
UPDATE garfield_nodelist_formatted_b_pmid_grants SET other_nih='0' WHERE other_nih IS NULL;
161-
*/
162-
163161
DROP TABLE IF EXISTS garfield_nodelist_formatted_b_pmid_grants;
164162
CREATE TABLE garfield_nodelist_formatted_b_pmid_grants AS
165163
SELECT
@@ -218,10 +216,11 @@ COPY (
218216
publication_year AS "publication_year:int",
219217
total_citation_count AS "total_citations:int"
220218
FROM chackoge.garfield_nodelist_final_citation
221-
) TO '/tmp/garfield_nodelist_final.csv' WITH (FORMAT CSV, HEADER);
219+
) TO '/tmp/garfield_nodelist_2g_final.csv' WITH (FORMAT CSV, HEADER);
222220

223221
COPY (
224222
SELECT source AS ":START_ID",
225223
target AS ":END_ID"
226224
FROM chackoge.garfield_edgelist
227-
) TO '/tmp/garfield_edgelist_final.csv' WITH (FORMAT CSV, HEADER);
225+
) TO '/tmp/garfield_edgelist_2g_final.csv' WITH (FORMAT CSV, HEADER);
226+

0 commit comments

Comments
 (0)