@@ -59,15 +59,16 @@ FROM garfield_dmet_begin a INNER JOIN wos_references b ON a.target=b.source_id;
5959-- Inner join garfield_dmet_twog_a to wos_publications on target = source_id so that only references present in wos_publications (viable references with complete WoS IDs) are kept
6060DROP TABLE IF EXISTS garfield_dmet_twog;
6161CREATE TABLE garfield_dmet_twog AS
62- SELECT a.* FROM garfield_dmet_twog_a INNER JOIN
63- wos_publications_b ON a .target = b .source_id ;
62+ SELECT a.* FROM garfield_dmet_twog_a a INNER JOIN -- aliases a and b are declared here so a.* and the ON clause resolve
63+ wos_publications b ON a .target = b .source_id ;
6464
6565-- Begin node list assembly: drop and recreate the staging table garfield_node_assembly that the INSERT statements below populate.
6666DROP TABLE IF EXISTS garfield_node_assembly;
6767CREATE TABLE garfield_node_assembly (node_id varchar (16 ),
6868node_name varchar (19 ),stype varchar (10 ),ttype varchar (10 ));
6969
7070-- build node_table
71+ -- insert from end point
7172-- gen1
7273INSERT INTO garfield_node_assembly(node_id,node_name,stype)
7374SELECT DISTINCT ' n' || substring (source,5 ),source,stype
@@ -86,14 +87,24 @@ INSERT INTO garfield_node_assembly(node_id,node_name,ttype)
8687SELECT DISTINCT ' n' || substring (target,5 ),target,ttype
8788FROM garfield_gen2;
8889
89- -- garfield_dmet_begin
90+ -- insert from start point (dmet plus)
91+ -- garfield_dmet_begin: one INSERT for the source side (fills stype) and one for the target side (fills ttype); node_id is a literal prefix concatenated with substring(id,5)
9092INSERT INTO garfield_node_assembly(node_id,node_name,stype)
9193SELECT DISTINCT ' n' || substring (source,5 ),source,stype
9294FROM garfield_dmet_begin;
9395
9496INSERT INTO garfield_node_assembly(node_id,node_name,ttype)
9597SELECT DISTINCT ' n' || substring (target,5 ),target,ttype
9698FROM garfield_dmet_begin;
99+
100+ -- gen1_cited: add both ends of each garfield_dmet_twog row as nodes (source side fills stype, target side fills ttype, matching the garfield_dmet_begin inserts)
101+ INSERT INTO garfield_node_assembly(node_id,node_name,stype)
102+ SELECT DISTINCT ' n' || substring (source,5 ),source,stype
103+ FROM garfield_dmet_twog;
104+
105+ INSERT INTO garfield_node_assembly(node_id,node_name,ttype)
106+ SELECT DISTINCT ' n' || substring (target,5 ),target,ttype
107+ FROM garfield_dmet_twog;
97108CREATE INDEX garfield_node_assembly_idx ON garfield_node_assembly(node_id); -- index on node_id, created after the node INSERT statements above
98109
99110DROP TABLE IF EXISTS garfield_nodelist;
@@ -116,6 +127,10 @@ FROM garfield_gen2;
116127INSERT INTO garfield_edge_table SELECT ' n' || substring (source,5 ) AS snid,
117128' n' || substring (target,5 ) as tnid, source, target, stype, ttype
118129FROM garfield_dmet_begin; -- edges from garfield_dmet_begin. NOTE(review): no column list on the INSERT, so it relies on garfield_edge_table's column order; confirm against its CREATE TABLE
130+
131+ INSERT INTO garfield_edge_table SELECT ' n' || substring (source,5 ) AS snid,
132+ ' n' || substring (target,5 ) as tnid, source, target, stype, ttype
133+ FROM garfield_dmet_twog; -- same projection, applied to the garfield_dmet_twog edges
119134CREATE INDEX garfield_edge_table_idx ON garfield_edge_table(snid,tnid); -- composite index on the derived source/target node ids
120135
121136DROP TABLE IF EXISTS garfield_edgelist;
@@ -143,23 +158,6 @@ CREATE TABLE garfield_nodelist_formatted_b_pmid AS
143158SELECT a.* ,b .pmid_int FROM garfield_nodelist_formatted_b a
144159LEFT JOIN wos_pmid_mapping b ON a .node_name = b .wos_id ;
145160
146- /*
147- DROP TABLE IF EXISTS garfield_nodelist_formatted_b_pmid_grants;
148- CREATE TABLE garfield_nodelist_formatted_b_pmid_grants AS
149- SELECT a.*,b.project_number FROM garfield_nodelist_formatted_b_pmid a
150- LEFT JOIN exporter_publink b ON a.pmid_int=b.pmid::int;
151-
152- ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN ic varchar(2);
153- ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN nida varchar(10);
154- ALTER TABLE garfield_nodelist_formatted_b_pmid_grants ADD COLUMN other_nih varchar(10);
155-
156- UPDATE garfield_nodelist_formatted_b_pmid_grants SET ic=substring(project_number,4,2);
157- UPDATE garfield_nodelist_formatted_b_pmid_grants SET nida='1' WHERE ic='DA';
158- UPDATE garfield_nodelist_formatted_b_pmid_grants SET nida='0' WHERE nida IS NULL;
159- UPDATE garfield_nodelist_formatted_b_pmid_grants SET other_nih='1' WHERE ic IS NOT NULL AND nida='0';
160- UPDATE garfield_nodelist_formatted_b_pmid_grants SET other_nih='0' WHERE other_nih IS NULL;
161- */
162-
163161DROP TABLE IF EXISTS garfield_nodelist_formatted_b_pmid_grants;
164162CREATE TABLE garfield_nodelist_formatted_b_pmid_grants AS
165163SELECT
@@ -218,10 +216,11 @@ COPY (
218216 publication_year AS " publication_year:int" ,
219217 total_citation_count AS " total_citations:int"
220218 FROM chackoge .garfield_nodelist_final_citation
221- ) TO ' /tmp/garfield_nodelist_final .csv' WITH (FORMAT CSV, HEADER);
219+ ) TO ' /tmp/garfield_nodelist_2g_final .csv' WITH (FORMAT CSV, HEADER);
222220
223221COPY ( -- export the source/target pairs of chackoge.garfield_edgelist as CSV with a header row
224222 SELECT source AS " :START_ID" ,
225223 target AS " :END_ID"
226224 FROM chackoge .garfield_edgelist
227- ) TO ' /tmp/garfield_edgelist_final.csv' WITH (FORMAT CSV, HEADER);
225+ ) TO ' /tmp/garfield_edgelist_2g_final.csv' WITH (FORMAT CSV, HEADER); -- NOTE(review): the path literal starts with a space; COPY TO a server file expects an absolute path, so confirm the literal
226+
0 commit comments