Skip to content

Commit 264166a

Browse files
Merge pull request nikolamilosevic86#6 from dbmi-pitt/master
Some of these changes might be useful for the main - not sure
2 parents 5d38a92 + b8fdb3c commit 264166a

34 files changed

+38074
-111
lines changed

DataBaseFileDrugs.sql

Lines changed: 80 additions & 87 deletions
Original file line number | Diff line number | Diff line change
@@ -1,132 +1,126 @@
1-
-- MySQL Script generated by MySQL Workbench
2-
-- 02/16/16 11:27:32
3-
-- Model: New Model Version: 1.0
1+
-- MySQL Script to generate SQL database for the Table Annotator
2+
--
3+
-- NOTE: This script does not create or select a schema; select the database you want these tables loaded into before running it.
4+
--
45
SET @OLD_UNIQUE_CHECKS=@@UNIQUE_CHECKS, UNIQUE_CHECKS=0;
56
SET @OLD_FOREIGN_KEY_CHECKS=@@FOREIGN_KEY_CHECKS, FOREIGN_KEY_CHECKS=0;
67
SET @OLD_SQL_MODE=@@SQL_MODE, SQL_MODE='TRADITIONAL,ALLOW_INVALID_DATES';
78

89
-- -----------------------------------------------------
9-
-- Schema table_db_drugs
10+
-- Table `Article`
1011
-- -----------------------------------------------------
11-
DROP SCHEMA IF EXISTS `table_db_drugs` ;
12-
CREATE SCHEMA IF NOT EXISTS `table_db_drugs` DEFAULT CHARACTER SET utf8 COLLATE utf8_general_ci ;
13-
USE `table_db_drugs` ;
12+
DROP TABLE IF EXISTS `Article` ;
1413

15-
-- -----------------------------------------------------
16-
-- Table `table_db_drugs`.`Article`
17-
-- -----------------------------------------------------
18-
DROP TABLE IF EXISTS `table_db_drugs`.`Article` ;
19-
20-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Article` (
14+
CREATE TABLE IF NOT EXISTS `Article` (
2115
`idArticle` INT NOT NULL AUTO_INCREMENT,
2216
`PMCID` VARCHAR(50) NULL,
2317
`PMID` VARCHAR(45) NULL,
2418
`pissn` VARCHAR(45) NULL,
2519
`eissn` VARCHAR(45) NULL,
26-
`Title` VARCHAR(500) NULL,
27-
`Abstract` VARCHAR(3000) NULL,
28-
`JournalName` VARCHAR(145) NULL,
29-
`JournalPublisherName` VARCHAR(245) NULL,
30-
`JournalPublisherLocation` VARCHAR(200) NULL,
31-
`Source` VARCHAR(100) NULL,
32-
`SpecId` VARCHAR(120) NULL,
33-
`PlainText` VARCHAR(10000) NULL,
20+
`Title` VARCHAR(2000) NULL,
21+
`Abstract` VARCHAR(5000) NULL,
22+
`JournalName` VARCHAR(2000) NULL,
23+
`JournalPublisherName` VARCHAR(2000) NULL,
24+
`JournalPublisherLocation` VARCHAR(5000) NULL,
25+
`Source` VARCHAR(500) NULL,
26+
`SpecId` VARCHAR(500) NULL,
27+
`PlainText` LONGTEXT NULL,
3428
PRIMARY KEY (`idArticle`))
3529
ENGINE = InnoDB;
3630

3731

3832
-- -----------------------------------------------------
39-
-- Table `table_db_drugs`.`Author`
33+
-- Table `Author`
4034
-- -----------------------------------------------------
41-
DROP TABLE IF EXISTS `table_db_drugs`.`Author` ;
35+
DROP TABLE IF EXISTS `Author` ;
4236

43-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Author` (
37+
CREATE TABLE IF NOT EXISTS `Author` (
4438
`idAuthor` INT NOT NULL AUTO_INCREMENT,
45-
`FirstName` VARCHAR(45) NULL,
46-
`LastName` VARCHAR(100) NULL,
39+
`FirstName` VARCHAR(200) NULL,
40+
`LastName` VARCHAR(200) NULL,
4741
`Article_idArticle` INT NOT NULL,
4842
PRIMARY KEY (`idAuthor`),
4943
INDEX `fk_Author_Article1_idx` (`Article_idArticle` ASC),
5044
CONSTRAINT `fk_Author_Article1`
5145
FOREIGN KEY (`Article_idArticle`)
52-
REFERENCES `table_db_drugs`.`Article` (`idArticle`)
46+
REFERENCES `Article` (`idArticle`)
5347
ON DELETE NO ACTION
5448
ON UPDATE NO ACTION)
5549
ENGINE = InnoDB;
5650

5751

5852
-- -----------------------------------------------------
59-
-- Table `table_db_drugs`.`ArtTable`
53+
-- Table `ArtTable`
6054
-- -----------------------------------------------------
61-
DROP TABLE IF EXISTS `table_db_drugs`.`ArtTable` ;
55+
DROP TABLE IF EXISTS `ArtTable` ;
6256

63-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`ArtTable` (
57+
CREATE TABLE IF NOT EXISTS `ArtTable` (
6458
`idTable` INT NOT NULL AUTO_INCREMENT,
65-
`TableOrder` VARCHAR(145) NULL,
66-
`TableCaption` VARCHAR(545) NULL,
67-
`TableFooter` VARCHAR(1445) NULL,
59+
`TableOrder` VARCHAR(500) NULL,
60+
`TableCaption` VARCHAR(5000) NULL,
61+
`TableFooter` VARCHAR(5000) NULL,
6862
`StructureType` VARCHAR(45) NULL,
6963
`PragmaticType` VARCHAR(45) NULL,
7064
`HasXML` VARCHAR(40) NULL,
7165
`Article_idArticle` INT NOT NULL,
72-
`Section` VARCHAR(245) NULL,
66+
`Section` VARCHAR(1000) NULL,
7367
PRIMARY KEY (`idTable`),
7468
INDEX `fk_Table_Article1_idx` (`Article_idArticle` ASC),
7569
CONSTRAINT `fk_Table_Article1`
7670
FOREIGN KEY (`Article_idArticle`)
77-
REFERENCES `table_db_drugs`.`Article` (`idArticle`)
71+
REFERENCES `Article` (`idArticle`)
7872
ON DELETE NO ACTION
7973
ON UPDATE NO ACTION)
8074
ENGINE = InnoDB;
8175

8276

8377
-- -----------------------------------------------------
84-
-- Table `table_db_drugs`.`Cell`
78+
-- Table `Cell`
8579
-- -----------------------------------------------------
86-
DROP TABLE IF EXISTS `table_db_drugs`.`Cell` ;
80+
DROP TABLE IF EXISTS `Cell` ;
8781

88-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Cell` (
82+
CREATE TABLE IF NOT EXISTS `Cell` (
8983
`idCell` INT NOT NULL AUTO_INCREMENT,
90-
`CellID` VARCHAR(45) NULL,
91-
`CellType` VARCHAR(45) NULL,
84+
`CellID` VARCHAR(200) NULL,
85+
`CellType` VARCHAR(200) NULL,
9286
`Table_idTable` INT NOT NULL,
9387
`RowN` INT NULL,
9488
`ColumnN` INT NULL,
95-
`HeaderRef` VARCHAR(45) NULL,
96-
`StubRef` VARCHAR(45) NULL,
97-
`SuperRowRef` VARCHAR(45) NULL,
98-
`Content` VARCHAR(545) NULL,
99-
`WholeHeader` VARCHAR(645) NULL,
100-
`WholeStub` VARCHAR(655) NULL,
101-
`WholeSuperRow` VARCHAR(645) NULL,
89+
`HeaderRef` VARCHAR(200) NULL,
90+
`StubRef` VARCHAR(200) NULL,
91+
`SuperRowRef` VARCHAR(200) NULL,
92+
`Content` VARCHAR(5000) NULL,
93+
`WholeHeader` VARCHAR(5000) NULL,
94+
`WholeStub` VARCHAR(5000) NULL,
95+
`WholeSuperRow` VARCHAR(5000) NULL,
10296
PRIMARY KEY (`idCell`),
10397
INDEX `fk_Cell_Table1_idx` (`Table_idTable` ASC),
10498
CONSTRAINT `fk_Cell_Table1`
10599
FOREIGN KEY (`Table_idTable`)
106-
REFERENCES `table_db_drugs`.`ArtTable` (`idTable`)
100+
REFERENCES `ArtTable` (`idTable`)
107101
ON DELETE NO ACTION
108102
ON UPDATE NO ACTION)
109103
ENGINE = InnoDB;
110104

111105

112106
-- -----------------------------------------------------
113-
-- Table `table_db_drugs`.`CellRole`
107+
-- Table `CellRole`
114108
-- -----------------------------------------------------
115-
DROP TABLE IF EXISTS `table_db_drugs`.`CellRole` ;
109+
DROP TABLE IF EXISTS `CellRole` ;
116110

117-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`CellRole` (
111+
CREATE TABLE IF NOT EXISTS `CellRole` (
118112
`idCellRole` INT NOT NULL AUTO_INCREMENT,
119113
`CellRoleName` VARCHAR(45) NULL,
120114
PRIMARY KEY (`idCellRole`))
121115
ENGINE = InnoDB;
122116

123117

124118
-- -----------------------------------------------------
125-
-- Table `table_db_drugs`.`CellRoles`
119+
-- Table `CellRoles`
126120
-- -----------------------------------------------------
127-
DROP TABLE IF EXISTS `table_db_drugs`.`CellRoles` ;
121+
DROP TABLE IF EXISTS `CellRoles` ;
128122

129-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`CellRoles` (
123+
CREATE TABLE IF NOT EXISTS `CellRoles` (
130124
`idCellRoles` INT NOT NULL AUTO_INCREMENT,
131125
`CellRole_idCellRole` INT NOT NULL,
132126
`Cell_idCell` INT NOT NULL,
@@ -135,91 +129,91 @@ CREATE TABLE IF NOT EXISTS `table_db_drugs`.`CellRoles` (
135129
INDEX `fk_CellRoles_Cell1_idx` (`Cell_idCell` ASC),
136130
CONSTRAINT `fk_CellRoles_CellRole1`
137131
FOREIGN KEY (`CellRole_idCellRole`)
138-
REFERENCES `table_db_drugs`.`CellRole` (`idCellRole`)
132+
REFERENCES `CellRole` (`idCellRole`)
139133
ON DELETE NO ACTION
140134
ON UPDATE NO ACTION,
141135
CONSTRAINT `fk_CellRoles_Cell1`
142136
FOREIGN KEY (`Cell_idCell`)
143-
REFERENCES `table_db_drugs`.`Cell` (`idCell`)
137+
REFERENCES `Cell` (`idCell`)
144138
ON DELETE NO ACTION
145139
ON UPDATE NO ACTION)
146140
ENGINE = InnoDB;
147141

148142

149143
-- -----------------------------------------------------
150-
-- Table `table_db_drugs`.`Annotation`
144+
-- Table `Annotation`
151145
-- -----------------------------------------------------
152-
DROP TABLE IF EXISTS `table_db_drugs`.`Annotation` ;
146+
DROP TABLE IF EXISTS `Annotation` ;
153147

154-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Annotation` (
148+
CREATE TABLE IF NOT EXISTS `Annotation` (
155149
`idAnnotation` INT NOT NULL AUTO_INCREMENT,
156-
`Content` VARCHAR(245) NULL,
150+
`Content` VARCHAR(1000) NULL,
157151
`Start` INT NULL,
158152
`End` INT NULL,
159-
`AnnotationID` VARCHAR(245) NULL,
160-
`AnnotationSchemaVersion` VARCHAR(245) NULL,
161-
`AnnotationDescription` VARCHAR(500) NULL,
162-
`AnnotationURL` VARCHAR(245) NULL,
163-
`AgentName` VARCHAR(345) NULL,
153+
`AnnotationID` VARCHAR(500) NULL,
154+
`AnnotationSchemaVersion` VARCHAR(500) NULL,
155+
`AnnotationDescription` VARCHAR(1500) NULL,
156+
`AnnotationURL` VARCHAR(1000) NULL,
157+
`AgentName` VARCHAR(500) NULL,
164158
`AgentType` VARCHAR(45) NULL,
165-
`EnvironmentDescription` VARCHAR(505) NULL,
159+
`EnvironmentDescription` VARCHAR(1000) NULL,
166160
`DateOfAction` DATETIME NULL,
167-
`Location` VARCHAR(200) NULL,
161+
`Location` VARCHAR(500) NULL,
168162
`Cell_idCell` INT NOT NULL,
169163
PRIMARY KEY (`idAnnotation`),
170164
INDEX `fk_Annotation_Cell1_idx` (`Cell_idCell` ASC),
171165
CONSTRAINT `fk_Annotation_Cell1`
172166
FOREIGN KEY (`Cell_idCell`)
173-
REFERENCES `table_db_drugs`.`Cell` (`idCell`)
167+
REFERENCES `Cell` (`idCell`)
174168
ON DELETE NO ACTION
175169
ON UPDATE NO ACTION)
176170
ENGINE = InnoDB;
177171

178172

179173
-- -----------------------------------------------------
180-
-- Table `table_db_drugs`.`Affiliation`
174+
-- Table `Affiliation`
181175
-- -----------------------------------------------------
182-
DROP TABLE IF EXISTS `table_db_drugs`.`Affiliation` ;
176+
DROP TABLE IF EXISTS `Affiliation` ;
183177

184-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Affiliation` (
178+
CREATE TABLE IF NOT EXISTS `Affiliation` (
185179
`idAffiliation` INT NOT NULL AUTO_INCREMENT,
186180
`AffiliationName` VARCHAR(345) NULL,
187181
`Author_idAuthor` INT NOT NULL,
188182
PRIMARY KEY (`idAffiliation`),
189183
INDEX `fk_Affiliation_Author1_idx` (`Author_idAuthor` ASC),
190184
CONSTRAINT `fk_Affiliation_Author1`
191185
FOREIGN KEY (`Author_idAuthor`)
192-
REFERENCES `table_db_drugs`.`Author` (`idAuthor`)
186+
REFERENCES `Author` (`idAuthor`)
193187
ON DELETE NO ACTION
194188
ON UPDATE NO ACTION)
195189
ENGINE = InnoDB;
196190

197191

198192
-- -----------------------------------------------------
199-
-- Table `table_db_drugs`.`Email`
193+
-- Table `Email`
200194
-- -----------------------------------------------------
201-
DROP TABLE IF EXISTS `table_db_drugs`.`Email` ;
195+
DROP TABLE IF EXISTS `Email` ;
202196

203-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`Email` (
197+
CREATE TABLE IF NOT EXISTS `Email` (
204198
`idEmail` INT NOT NULL AUTO_INCREMENT,
205-
`Email` VARCHAR(245) NULL,
199+
`Email` VARCHAR(1000) NULL,
206200
`Author_idAuthor` INT NOT NULL,
207201
PRIMARY KEY (`idEmail`, `Author_idAuthor`),
208202
INDEX `fk_Email_Author1_idx` (`Author_idAuthor` ASC),
209203
CONSTRAINT `fk_Email_Author1`
210204
FOREIGN KEY (`Author_idAuthor`)
211-
REFERENCES `table_db_drugs`.`Author` (`idAuthor`)
205+
REFERENCES `Author` (`idAuthor`)
212206
ON DELETE NO ACTION
213207
ON UPDATE NO ACTION)
214208
ENGINE = InnoDB;
215209

216210

217211
-- -----------------------------------------------------
218-
-- Table `table_db_drugs`.`OriginalArticle`
212+
-- Table `OriginalArticle`
219213
-- -----------------------------------------------------
220-
DROP TABLE IF EXISTS `table_db_drugs`.`OriginalArticle` ;
214+
DROP TABLE IF EXISTS `OriginalArticle` ;
221215

222-
CREATE TABLE IF NOT EXISTS `table_db_drugs`.`OriginalArticle` (
216+
CREATE TABLE IF NOT EXISTS `OriginalArticle` (
223217
`idOriginalArticle` INT NOT NULL AUTO_INCREMENT,
224218
`PMCID` VARCHAR(50) NULL,
225219
`PMID` VARCHAR(45) NULL,
@@ -232,7 +226,7 @@ CREATE TABLE IF NOT EXISTS `table_db_drugs`.`OriginalArticle` (
232226
INDEX `fk_OriginalArticle_Article1_idx` (`Article_idArticle` ASC),
233227
CONSTRAINT `fk_OriginalArticle_Article1`
234228
FOREIGN KEY (`Article_idArticle`)
235-
REFERENCES `table_db_drugs`.`Article` (`idArticle`)
229+
REFERENCES `Article` (`idArticle`)
236230
ON DELETE NO ACTION
237231
ON UPDATE NO ACTION)
238232
ENGINE = InnoDB;
@@ -243,14 +237,13 @@ SET FOREIGN_KEY_CHECKS=@OLD_FOREIGN_KEY_CHECKS;
243237
SET UNIQUE_CHECKS=@OLD_UNIQUE_CHECKS;
244238

245239
-- -----------------------------------------------------
246-
-- Data for table `table_db_drugs`.`CellRole`
240+
-- Data for table `CellRole`
247241
-- -----------------------------------------------------
248242
START TRANSACTION;
249-
USE `table_db_drugs`;
250-
INSERT INTO `table_db_drugs`.`CellRole` (`idCellRole`, `CellRoleName`) VALUES (1, 'Header');
251-
INSERT INTO `table_db_drugs`.`CellRole` (`idCellRole`, `CellRoleName`) VALUES (2, 'Stub');
252-
INSERT INTO `table_db_drugs`.`CellRole` (`idCellRole`, `CellRoleName`) VALUES (3, 'Data');
253-
INSERT INTO `table_db_drugs`.`CellRole` (`idCellRole`, `CellRoleName`) VALUES (4, 'SuperRow');
243+
INSERT INTO `CellRole` (`idCellRole`, `CellRoleName`) VALUES (1, 'Header');
244+
INSERT INTO `CellRole` (`idCellRole`, `CellRoleName`) VALUES (2, 'Stub');
245+
INSERT INTO `CellRole` (`idCellRole`, `CellRoleName`) VALUES (3, 'Data');
246+
INSERT INTO `CellRole` (`idCellRole`, `CellRoleName`) VALUES (4, 'SuperRow');
254247

255248
COMMIT;
256249

analysis-UPCI/README

Whitespace-only changes.

annotation/check_annotated_setIDs.py

Lines changed: 43 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,43 @@
1+
import mysql.connector
2+
import csv
3+
import re
4+
5+
# Get database connection settings
6+
settings = []
7+
with open("settings.cfg", "r+") as config_file:
8+
hold = config_file.readlines()
9+
for h in hold:
10+
splits = h.split(";")
11+
line = []
12+
line.append(splits[0])
13+
line.append(splits[1])
14+
settings.append(line)
15+
16+
for line in settings:
17+
if "database_username" in line[0]:
18+
usr = line[1]
19+
if "database_password" in line[0]:
20+
pword = line[1]
21+
if "database_host" in line[0]:
22+
hst = line[1]
23+
if "database_name" in line[0]:
24+
dbname = line[1]
25+
if "database_port" in line[0]:
26+
dbport = line[1]
27+
28+
cnx = mysql.connector.connect(user=usr, password=pword, host=hst, database=dbname)
29+
30+
cursor = cnx.cursor()
31+
32+
setIDs_already_annotated = []
33+
34+
check_query = (
35+
"SELECT DISTINCT SpecId FROM Article; ")
36+
37+
cursor.execute(check_query)
38+
39+
40+
with open('setIDs-already-annotated.txt', 'wb') as outfile:
41+
for s in cursor:
42+
outfile.write("%s\n" % s)
43+

0 commit comments

Comments
 (0)