line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# MetaMap::DataStructures::Citation |
2
|
|
|
|
|
|
|
# (Last Updated $Id: Citation.pm,v 1.80 2016/01/07 22:49:33 btmcinnes Exp $) |
3
|
|
|
|
|
|
|
# |
4
|
|
|
|
|
|
|
# Perl module that provides a perl interface to the |
5
|
|
|
|
|
|
|
# Unified Medical Language System (UMLS) |
6
|
|
|
|
|
|
|
# |
7
|
|
|
|
|
|
|
# Copyright (c) 2016 |
8
|
|
|
|
|
|
|
# |
9
|
|
|
|
|
|
|
# Sam Henry, Virginia Commonwealth University |
10
|
|
|
|
|
|
|
# henryst at vcu.edu |
11
|
|
|
|
|
|
|
# |
12
|
|
|
|
|
|
|
# Bridget T. McInnes, Virginia Commonwealth University |
13
|
|
|
|
|
|
|
# btmcinnes at vcu.edu |
14
|
|
|
|
|
|
|
# |
15
|
|
|
|
|
|
|
# This program is free software; you can redistribute it and/or |
16
|
|
|
|
|
|
|
# modify it under the terms of the GNU General Public License |
17
|
|
|
|
|
|
|
# as published by the Free Software Foundation; either version 2 |
18
|
|
|
|
|
|
|
# of the License, or (at your option) any later version. |
19
|
|
|
|
|
|
|
# |
20
|
|
|
|
|
|
|
# This program is distributed in the hope that it will be useful, |
21
|
|
|
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of |
22
|
|
|
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
23
|
|
|
|
|
|
|
# GNU General Public License for more details. |
24
|
|
|
|
|
|
|
# |
25
|
|
|
|
|
|
|
# You should have received a copy of the GNU General Public License |
26
|
|
|
|
|
|
|
# along with this program; if not, write to |
27
|
|
|
|
|
|
|
# |
28
|
|
|
|
|
|
|
# The Free Software Foundation, Inc., |
29
|
|
|
|
|
|
|
# 59 Temple Place - Suite 330, |
30
|
|
|
|
|
|
|
# Boston, MA 02111-1307, USA. |
31
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
package MetaMap::DataStructures::Citation; |
33
|
1
|
|
|
1
|
|
4
|
use strict; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
21
|
|
34
|
1
|
|
|
1
|
|
3
|
use warnings; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
18
|
|
35
|
|
|
|
|
|
|
|
36
|
1
|
|
|
1
|
|
3
|
use MetaMap::DataStructures::Utterance; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
1139
|
|
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
#---------------------------------------- |
39
|
|
|
|
|
|
|
# constructors |
40
|
|
|
|
|
|
|
#---------------------------------------- |
41
|
|
|
|
|
|
|
# constructor method to create a new Citation object |
42
|
|
|
|
|
|
|
# input : - |
43
|
|
|
|
|
|
|
# output: $self <- a instance of a Citation object |
44
|
|
|
|
|
|
|
sub new { |
45
|
|
|
|
|
|
|
#create and bless self |
46
|
5
|
|
|
5
|
0
|
6
|
my $class = shift; |
47
|
5
|
|
|
|
|
6
|
my $self = {}; |
48
|
5
|
|
|
|
|
9
|
bless $self, $class; |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
#grab input and initialize |
51
|
5
|
|
|
|
|
11
|
$self->{id} = shift; |
52
|
5
|
|
|
|
|
6
|
$self->{utterances} = {}; |
53
|
|
|
|
|
|
|
|
54
|
5
|
|
|
|
|
11
|
return $self; |
55
|
|
|
|
|
|
|
} |
56
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
#----------------------------------------------------------------- |
58
|
|
|
|
|
|
|
# methods |
59
|
|
|
|
|
|
|
#----------------------------------------------------------------- |
60
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
# method summarizes this utterance as a string |
62
|
|
|
|
|
|
|
# input : - |
63
|
|
|
|
|
|
|
# output: $string <- a string describing $self |
64
|
|
|
|
|
|
|
sub toString { |
65
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
66
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
#initiliaze the string |
68
|
0
|
|
|
|
|
0
|
my $string = "citation:\n"; |
69
|
0
|
|
|
|
|
0
|
$string .= " $self->{id}\n"; |
70
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
#add each utterance to the string |
72
|
0
|
|
|
|
|
0
|
my %utterances = %{$self->{utterances}}; |
|
0
|
|
|
|
|
0
|
|
73
|
0
|
|
|
|
|
0
|
foreach my $key(keys %utterances) { |
74
|
0
|
|
|
|
|
0
|
$string .= " ".$utterances{$key}->toString()."\n"; |
75
|
|
|
|
|
|
|
} |
76
|
0
|
|
|
|
|
0
|
return $string; |
77
|
|
|
|
|
|
|
} |
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
# method to compare this citation to another and returns 1 if the two |
80
|
|
|
|
|
|
|
# contain identical information |
81
|
|
|
|
|
|
|
# input : $other <- the citation object to compare against |
82
|
|
|
|
|
|
|
# output: boolean <- 1 if $self and $other are equivalent (contain equivalent |
83
|
|
|
|
|
|
|
# ID's and utterances), else 0 |
84
|
|
|
|
|
|
|
sub equals { |
85
|
|
|
|
|
|
|
#grab input |
86
|
3
|
|
|
3
|
0
|
6
|
my $self = shift; |
87
|
3
|
|
|
|
|
3
|
my $other = shift; |
88
|
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
#compare id's |
90
|
3
|
50
|
|
|
|
10
|
if ($self->{id} ne $other->{id}) { |
91
|
0
|
|
|
|
|
0
|
return 0; |
92
|
|
|
|
|
|
|
} |
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
#compare Utterances |
95
|
3
|
|
|
|
|
3
|
foreach my $keyA(sort _by_utterance keys %{$self->{utterances}}){ |
|
3
|
|
|
|
|
15
|
|
96
|
3
|
|
|
|
|
4
|
my $utteranceA = $self->{utterances}{$keyA}; |
97
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
#check each utterance in B |
99
|
3
|
|
|
|
|
4
|
my $match = 0; |
100
|
3
|
|
|
|
|
5
|
foreach my $keyB(sort _by_utterance keys %{$other->{utterances}}) { |
|
3
|
|
|
|
|
6
|
|
101
|
2
|
|
|
|
|
3
|
my $utteranceB = $self->{utterances}{$keyB}; |
102
|
2
|
50
|
|
|
|
5
|
if ($utteranceA->equals($utteranceB)) { |
103
|
2
|
|
|
|
|
3
|
$match = 1; |
104
|
2
|
|
|
|
|
4
|
last; |
105
|
|
|
|
|
|
|
} |
106
|
|
|
|
|
|
|
} |
107
|
|
|
|
|
|
|
|
108
|
|
|
|
|
|
|
#citationA has no equivalent citation in $other |
109
|
|
|
|
|
|
|
# so citations are not identical |
110
|
3
|
100
|
|
|
|
10
|
if ($match < 1) { |
111
|
1
|
|
|
|
|
4
|
return 0; |
112
|
|
|
|
|
|
|
} |
113
|
|
|
|
|
|
|
} |
114
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
#all tests passed, return true |
116
|
2
|
|
|
|
|
21
|
return 1; |
117
|
|
|
|
|
|
|
} |
118
|
|
|
|
|
|
|
|
119
|
|
|
|
|
|
|
# method to determine if this citation contains the CUI provided as input |
120
|
|
|
|
|
|
|
# returns 1 if this citation contains the CUI, else 0 |
121
|
|
|
|
|
|
|
# input : $cui <- a string CUI code |
122
|
|
|
|
|
|
|
# output: boolean <- 1 if any of $self's utterances contain $cui |
123
|
|
|
|
|
|
|
sub contains { |
124
|
|
|
|
|
|
|
#grab input |
125
|
2
|
|
|
2
|
0
|
11
|
my $self = shift; |
126
|
2
|
|
|
|
|
3
|
my $cui = shift; |
127
|
|
|
|
|
|
|
|
128
|
|
|
|
|
|
|
#check each phrase to see if it contains the CUI |
129
|
2
|
|
|
|
|
4
|
my $containsCUI = 0; |
130
|
2
|
|
|
|
|
1
|
foreach my $key(keys %{$self->{utterances}}) { |
|
2
|
|
|
|
|
5
|
|
131
|
2
|
100
|
|
|
|
6
|
if ($self->{utterances}{$key}->contains($cui)) { |
132
|
1
|
|
|
|
|
1
|
$containsCUI = 1; |
133
|
1
|
|
|
|
|
2
|
last; |
134
|
|
|
|
|
|
|
} |
135
|
|
|
|
|
|
|
} |
136
|
|
|
|
|
|
|
|
137
|
|
|
|
|
|
|
#return the result |
138
|
2
|
|
|
|
|
7
|
return $containsCUI; |
139
|
|
|
|
|
|
|
} |
140
|
|
|
|
|
|
|
|
141
|
|
|
|
|
|
|
# method to add a new utterance to the citation |
142
|
|
|
|
|
|
|
# input : $newUtterance <- the utterance to add to $self |
143
|
|
|
|
|
|
|
# output: - |
144
|
|
|
|
|
|
|
sub addUtterance { |
145
|
9
|
|
|
9
|
0
|
12
|
my $self = shift; |
146
|
9
|
|
|
|
|
9
|
my $newUtterance = shift; |
147
|
|
|
|
|
|
|
|
148
|
9
|
50
|
|
|
|
42
|
if($newUtterance->{id} =~ /((ti|ab)\.[\d]+)/) { |
149
|
9
|
|
|
|
|
1417
|
$self->{utterances}{$1} = $newUtterance; |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
else { |
152
|
0
|
|
|
|
|
0
|
print STDERR "error adding utterance to citation: $newUtterance->{id}\n"; |
153
|
|
|
|
|
|
|
} |
154
|
|
|
|
|
|
|
} |
155
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
# method to sort the utterances by order they appear (title followed |
157
|
|
|
|
|
|
|
# by abstract, number ascending) |
158
|
|
|
|
|
|
|
# (e.g. ti.000.1, ti.000.2, ab.000.1, ab.000.2, ab.000.3) |
159
|
|
|
|
|
|
|
# input : $a, $b <- implicit sort variables, the keys in a hash of utterances |
160
|
|
|
|
|
|
|
# which are the utterance IDs (e.g. ti.0000000.1) |
161
|
|
|
|
|
|
|
# output: integer <- -1 if a is before b, 0 if a and b are same order, |
162
|
|
|
|
|
|
|
# 1 if a is after b |
163
|
|
|
|
|
|
|
sub _by_utterance { |
164
|
|
|
|
|
|
|
#get the utterance type |
165
|
0
|
|
|
0
|
|
0
|
my $a_ab = ($a =~ /ab/); |
166
|
0
|
|
|
|
|
0
|
my $b_ab = ($b =~ /ab/); |
167
|
|
|
|
|
|
|
|
168
|
|
|
|
|
|
|
#check if both are abstracts or titles |
169
|
0
|
0
|
|
|
|
0
|
if ($a_ab == $b_ab) { |
170
|
0
|
|
|
|
|
0
|
$a =~ /(ti|ab)\.([\d]+)/; |
171
|
0
|
|
|
|
|
0
|
my $aNum = ($2); |
172
|
|
|
|
|
|
|
|
173
|
0
|
|
|
|
|
0
|
$b =~ /(ti|ab)\.([\d]+)/; |
174
|
0
|
|
|
|
|
0
|
return $aNum <=> $2; |
175
|
|
|
|
|
|
|
} |
176
|
|
|
|
|
|
|
|
177
|
|
|
|
|
|
|
#check if one is abstract, the other is title |
178
|
0
|
0
|
0
|
|
|
0
|
if ($a_ab && !$b_ab) { |
179
|
0
|
|
|
|
|
0
|
return 1; |
180
|
|
|
|
|
|
|
} |
181
|
0
|
0
|
0
|
|
|
0
|
if (!$a_ab && $b_ab) { |
182
|
0
|
|
|
|
|
0
|
return -1; |
183
|
|
|
|
|
|
|
} |
184
|
|
|
|
|
|
|
} |
185
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
|
187
|
|
|
|
|
|
|
#------------------------------ Get Components ------------------------------ |
188
|
|
|
|
|
|
|
# method to returns an ordered list of Utterances contained by the Citation. |
189
|
|
|
|
|
|
|
# Utterances are ordered by title, abstract, then number in ascending order |
190
|
|
|
|
|
|
|
# (e.g. ti.000.1, ti.000.2, ab.000.1, ab.000.2, ab.000.3) |
191
|
|
|
|
|
|
|
# input : - |
192
|
|
|
|
|
|
|
# output: \@utterances <- $self's utterances ordered as they appear in the |
193
|
|
|
|
|
|
|
# original text of $self |
194
|
|
|
|
|
|
|
sub getOrderedUtterances { |
195
|
|
|
|
|
|
|
#initialize |
196
|
2
|
|
|
2
|
0
|
69
|
my $self = shift; |
197
|
2
|
|
|
|
|
4
|
my @utterances = (); |
198
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
#add concepts in sorted order |
200
|
2
|
|
|
|
|
3
|
foreach my $key(sort _by_utterance keys %{$self->{utterances}}) { |
|
2
|
|
|
|
|
10
|
|
201
|
2
|
|
|
|
|
3
|
push @utterances, $self->{utterances}{$key}; |
202
|
|
|
|
|
|
|
} |
203
|
2
|
|
|
|
|
4
|
return \@utterances; |
204
|
|
|
|
|
|
|
} |
205
|
|
|
|
|
|
|
|
206
|
|
|
|
|
|
|
# method to get an array of concepts that appear in the citation |
207
|
|
|
|
|
|
|
# (not necassarily ordered). Use this method if order doesn't matter for |
208
|
|
|
|
|
|
|
# increased performance. |
209
|
|
|
|
|
|
|
# input : - |
210
|
|
|
|
|
|
|
# output: \@concepts <- a list of concept objects |
211
|
|
|
|
|
|
|
sub getConcepts { |
212
|
|
|
|
|
|
|
#initialize |
213
|
1
|
|
|
1
|
0
|
11
|
my $self = shift; |
214
|
1
|
|
|
|
|
1
|
my @concepts = (); |
215
|
|
|
|
|
|
|
|
216
|
|
|
|
|
|
|
#add concepts in sorted order |
217
|
1
|
|
|
|
|
2
|
foreach my $key(keys %{$self->{utterances}}) { |
|
1
|
|
|
|
|
2
|
|
218
|
1
|
|
|
|
|
2
|
push @concepts, @{ $self->{utterances}{$key}->getConcepts() }; |
|
1
|
|
|
|
|
3
|
|
219
|
|
|
|
|
|
|
} |
220
|
1
|
|
|
|
|
3
|
return \@concepts; |
221
|
|
|
|
|
|
|
} |
222
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
# method to get the unique concepts and return a hash of |
224
|
|
|
|
|
|
|
# concepts, CUIs are the keys |
225
|
|
|
|
|
|
|
# input : - |
226
|
|
|
|
|
|
|
# output: \%concepts <- $self's unique concepts with the key as the concept's |
227
|
|
|
|
|
|
|
# CUI. CUIs are considered unique by their CUI code only (e.g. C0000000 |
228
|
|
|
|
|
|
|
# and C0000000 are considered the same even if there are two different |
229
|
|
|
|
|
|
|
# Concept.pm objects associated with them) |
230
|
|
|
|
|
|
|
sub getUniqueConcepts { |
231
|
1
|
|
|
1
|
0
|
182
|
my $self = shift; |
232
|
1
|
|
|
|
|
3
|
my %concepts = (); |
233
|
|
|
|
|
|
|
|
234
|
|
|
|
|
|
|
#update concepts |
235
|
1
|
|
|
|
|
1
|
foreach my $key(keys %{$self->{utterances}}) { |
|
1
|
|
|
|
|
4
|
|
236
|
1
|
|
|
|
|
4
|
my $utteranceConceptsRef = $self->{utterances}{$key}->getConcepts(); |
237
|
1
|
|
|
|
|
1
|
foreach my $concept(@{ $utteranceConceptsRef }) { |
|
1
|
|
|
|
|
2
|
|
238
|
80
|
|
|
|
|
59
|
my $cui = $concept->{cui}; |
239
|
80
|
100
|
|
|
|
96
|
if (!exists $concepts{$cui}) { |
240
|
75
|
|
|
|
|
89
|
$concepts{$cui} = $concept; |
241
|
|
|
|
|
|
|
} |
242
|
|
|
|
|
|
|
} |
243
|
|
|
|
|
|
|
} |
244
|
1
|
|
|
|
|
18
|
return \%concepts; |
245
|
|
|
|
|
|
|
} |
246
|
|
|
|
|
|
|
|
247
|
|
|
|
|
|
|
# method to get the an array of concepts that appear in the citation |
248
|
|
|
|
|
|
|
# concepts are ordered as they appear in the utterance |
249
|
|
|
|
|
|
|
# however where there are multiple mappings for a single |
250
|
|
|
|
|
|
|
# token those two concepts will appear adjacent to one another |
251
|
|
|
|
|
|
|
# input : - |
252
|
|
|
|
|
|
|
# output: \@conceptList <- an array of arrays, where each sub-array contains a |
253
|
|
|
|
|
|
|
# list of 1 or more concept objects. Where more than |
254
|
|
|
|
|
|
|
# one concept object occurrs it means the token to |
255
|
|
|
|
|
|
|
# concept mapping was ambiguous. Arrays are ordered as |
256
|
|
|
|
|
|
|
# the tokens occurr in the utterance. |
257
|
|
|
|
|
|
|
sub getOrderedConcepts { |
258
|
|
|
|
|
|
|
#initialize |
259
|
1
|
|
|
1
|
0
|
94
|
my $self = shift; |
260
|
1
|
|
|
|
|
2
|
my @conceptsList = (); |
261
|
|
|
|
|
|
|
|
262
|
|
|
|
|
|
|
#add concepts in sorted order |
263
|
1
|
|
|
|
|
2
|
foreach my $key(sort _by_utterance keys %{$self->{utterances}}) { |
|
1
|
|
|
|
|
3
|
|
264
|
1
|
|
|
|
|
2
|
push @conceptsList, @{ $self->{utterances}{$key}->getOrderedConcepts() }; |
|
1
|
|
|
|
|
4
|
|
265
|
|
|
|
|
|
|
} |
266
|
1
|
|
|
|
|
2
|
return \@conceptsList; |
267
|
|
|
|
|
|
|
} |
268
|
|
|
|
|
|
|
|
269
|
|
|
|
|
|
|
# method to get a list of ordered mappings. There may be multiple |
270
|
|
|
|
|
|
|
# mappings for a single utterance, but they will appear in correct |
271
|
|
|
|
|
|
|
# utterance order |
272
|
|
|
|
|
|
|
# input : - |
273
|
|
|
|
|
|
|
# output: \@mappings <- a list of mapping objects ordered by their occurence in |
274
|
|
|
|
|
|
|
# $self. |
275
|
|
|
|
|
|
|
sub getOrderedMappings { |
276
|
|
|
|
|
|
|
#initialize |
277
|
1
|
|
|
1
|
0
|
100
|
my $self = shift; |
278
|
1
|
|
|
|
|
1
|
my @mappings = (); |
279
|
|
|
|
|
|
|
|
280
|
|
|
|
|
|
|
#add mappings in sorted order |
281
|
1
|
|
|
|
|
2
|
foreach my $key(sort _by_utterance keys %{$self->{utterances}}) { |
|
1
|
|
|
|
|
4
|
|
282
|
1
|
|
|
|
|
1
|
push @mappings, @{ $self->{utterances}{$key}->getMappings() }; |
|
1
|
|
|
|
|
4
|
|
283
|
|
|
|
|
|
|
} |
284
|
1
|
|
|
|
|
2
|
return \@mappings; |
285
|
|
|
|
|
|
|
} |
286
|
|
|
|
|
|
|
|
287
|
|
|
|
|
|
|
# method to get all the mappings of the citation (not necassarily ordered) |
288
|
|
|
|
|
|
|
# input : - |
289
|
|
|
|
|
|
|
# output: \@mappings <- a list of mapping objects |
290
|
|
|
|
|
|
|
sub getMappings { |
291
|
|
|
|
|
|
|
#initialize |
292
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
293
|
0
|
|
|
|
|
0
|
my @mappings = (); |
294
|
|
|
|
|
|
|
|
295
|
|
|
|
|
|
|
#add mappings in sorted order |
296
|
0
|
|
|
|
|
0
|
foreach my $key(keys %{$self->{utterances}}) { |
|
0
|
|
|
|
|
0
|
|
297
|
0
|
|
|
|
|
0
|
push @mappings, @{ $self->{utterances}{$key}->getMappings() }; |
|
0
|
|
|
|
|
0
|
|
298
|
|
|
|
|
|
|
} |
299
|
0
|
|
|
|
|
0
|
return \@mappings; |
300
|
|
|
|
|
|
|
} |
301
|
|
|
|
|
|
|
|
302
|
|
|
|
|
|
|
# method to get an array of ordered tokens as they appear in the citation |
303
|
|
|
|
|
|
|
# input : - |
304
|
|
|
|
|
|
|
# output: \@tokens <- a list of token objects ordered by their appearance in |
305
|
|
|
|
|
|
|
# $self |
306
|
|
|
|
|
|
|
sub getOrderedTokens |
307
|
|
|
|
|
|
|
{ |
308
|
|
|
|
|
|
|
#initialize |
309
|
3
|
|
|
3
|
0
|
165
|
my $self = shift; |
310
|
3
|
|
|
|
|
5
|
my @tokens = (); |
311
|
|
|
|
|
|
|
|
312
|
|
|
|
|
|
|
#add words in sorted order |
313
|
3
|
|
|
|
|
3
|
foreach my $key(sort _by_utterance keys %{$self->{utterances}}) { |
|
3
|
|
|
|
|
9
|
|
314
|
2
|
|
|
|
|
1
|
push @tokens, @{ $self->{utterances}{$key}->getTokens() }; |
|
2
|
|
|
|
|
8
|
|
315
|
|
|
|
|
|
|
} |
316
|
3
|
|
|
|
|
5
|
return \@tokens; |
317
|
|
|
|
|
|
|
} |
318
|
|
|
|
|
|
|
|
319
|
|
|
|
|
|
|
# method to get an array of tokens. Tokens are not necassarily in order |
320
|
|
|
|
|
|
|
# input : - |
321
|
|
|
|
|
|
|
# output: \@tokens <- a list of token objects |
322
|
|
|
|
|
|
|
sub getTokens |
323
|
|
|
|
|
|
|
{ |
324
|
|
|
|
|
|
|
#initialize |
325
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
326
|
0
|
|
|
|
|
0
|
my @tokens = (); |
327
|
|
|
|
|
|
|
|
328
|
|
|
|
|
|
|
#add words in sorted order |
329
|
0
|
|
|
|
|
0
|
foreach my $key(keys %{$self->{utterances}}) { |
|
0
|
|
|
|
|
0
|
|
330
|
0
|
|
|
|
|
0
|
push @tokens, @{ $self->{utterances}{$key}->getTokens() }; |
|
0
|
|
|
|
|
0
|
|
331
|
|
|
|
|
|
|
} |
332
|
0
|
|
|
|
|
0
|
return \@tokens; |
333
|
|
|
|
|
|
|
} |
334
|
|
|
|
|
|
|
|
335
|
|
|
|
|
|
|
#---------------------- Has Parts (title or abstract) ------------------------- |
336
|
|
|
|
|
|
|
# method to determine if the citation contains any title utterances |
337
|
|
|
|
|
|
|
# input : - |
338
|
|
|
|
|
|
|
# output: boolean <- 1 if $self contains a title utterance, else 0 |
339
|
|
|
|
|
|
|
sub hasTitle |
340
|
|
|
|
|
|
|
{ |
341
|
1
|
|
|
1
|
0
|
518
|
my $self = shift; |
342
|
1
|
|
|
|
|
3
|
return $self->_hasPart('ti'); |
343
|
|
|
|
|
|
|
|
344
|
|
|
|
|
|
|
} |
345
|
|
|
|
|
|
|
|
346
|
|
|
|
|
|
|
# method to determine if the citation contains any abstract utterances |
347
|
|
|
|
|
|
|
# input : - |
348
|
|
|
|
|
|
|
# output: boolean <- 1 if $self contains an abstract utterance, else 0 |
349
|
|
|
|
|
|
|
sub hasAbstract |
350
|
|
|
|
|
|
|
{ |
351
|
1
|
|
|
1
|
0
|
4
|
my $self = shift; |
352
|
1
|
|
|
|
|
2
|
return $self->_hasPart('ab'); |
353
|
|
|
|
|
|
|
|
354
|
|
|
|
|
|
|
} |
355
|
|
|
|
|
|
|
|
356
|
|
|
|
|
|
|
# method to determine if the citation contains any utterances of the |
357
|
|
|
|
|
|
|
# tag ('ti' or 'ab') |
358
|
|
|
|
|
|
|
# input : $tag <- the utterance tag to check for, should be 'ti' or 'ab' |
359
|
|
|
|
|
|
|
# output: boolean <- 1 if $self contains an utterance with the $tag, else 0 |
360
|
|
|
|
|
|
|
sub _hasPart |
361
|
|
|
|
|
|
|
{ |
362
|
2
|
|
|
2
|
|
3
|
my $self = shift; |
363
|
2
|
|
|
|
|
2
|
my $tag = shift; |
364
|
|
|
|
|
|
|
|
365
|
|
|
|
|
|
|
#get the utterances that match the tag |
366
|
2
|
|
|
|
|
3
|
foreach my $key(keys %{$self->{utterances}}) { |
|
2
|
|
|
|
|
4
|
|
367
|
2
|
50
|
|
|
|
10
|
if ($key =~ /(ti|ab)/) { |
368
|
2
|
100
|
|
|
|
7
|
if ($1 eq $tag) { |
369
|
|
|
|
|
|
|
#tag found, returning true |
370
|
1
|
|
|
|
|
3
|
return 1; |
371
|
|
|
|
|
|
|
} |
372
|
|
|
|
|
|
|
} |
373
|
|
|
|
|
|
|
} |
374
|
|
|
|
|
|
|
#no matching tags found, returning false |
375
|
1
|
|
|
|
|
3
|
return 0; |
376
|
|
|
|
|
|
|
} |
377
|
|
|
|
|
|
|
#---------------------------------------------------------------------------- |
378
|
|
|
|
|
|
|
|
379
|
|
|
|
|
|
|
|
380
|
|
|
|
|
|
|
#------------------ Get Parts (Title or Abstract) --------------------- |
381
|
|
|
|
|
|
|
# method to create a new citation containing just the title of this citation |
382
|
|
|
|
|
|
|
# input : - |
383
|
|
|
|
|
|
|
# output: $part <- a citation object containing all utterances of $self's title |
384
|
|
|
|
|
|
|
sub getTitle |
385
|
|
|
|
|
|
|
{ |
386
|
2
|
|
|
2
|
0
|
25
|
my $self = shift; |
387
|
2
|
|
|
|
|
6
|
return $self->_getPart('ti'); |
388
|
|
|
|
|
|
|
} |
389
|
|
|
|
|
|
|
|
390
|
|
|
|
|
|
|
# method to create a new citation containing just the abstract of this citation |
391
|
|
|
|
|
|
|
# input : - |
392
|
|
|
|
|
|
|
# output: $part <- a citation object containing all utterances of $self's |
393
|
|
|
|
|
|
|
# abstract |
394
|
|
|
|
|
|
|
sub getAbstract |
395
|
|
|
|
|
|
|
{ |
396
|
2
|
|
|
2
|
0
|
100
|
my $self = shift; |
397
|
2
|
|
|
|
|
5
|
return $self->_getPart('ab'); |
398
|
|
|
|
|
|
|
} |
399
|
|
|
|
|
|
|
|
400
|
|
|
|
|
|
|
# method to get a part of this citation (title or abstract) |
401
|
|
|
|
|
|
|
# input is a match string, either 'ti' or 'ab' |
402
|
|
|
|
|
|
|
# input : $tag <- the utterance tag to extract, should be 'ti' or 'ab' |
403
|
|
|
|
|
|
|
# output: $part <- a citation object containing all utterance of $self |
404
|
|
|
|
|
|
|
# containing the $tag in their ID |
405
|
|
|
|
|
|
|
sub _getPart |
406
|
|
|
|
|
|
|
{ |
407
|
4
|
|
|
4
|
|
5
|
my $self = shift; |
408
|
4
|
|
|
|
|
5
|
my $tag = shift; |
409
|
|
|
|
|
|
|
|
410
|
|
|
|
|
|
|
#get the utterances that match the tag |
411
|
4
|
|
|
|
|
16
|
my $part = MetaMap::DataStructures::Citation->new($self->{id}); |
412
|
4
|
|
|
|
|
6
|
foreach my $key(keys %{$self->{utterances}}) { |
|
4
|
|
|
|
|
12
|
|
413
|
4
|
50
|
|
|
|
35
|
if($key =~ /(ti|ab)/) { |
414
|
4
|
100
|
|
|
|
19
|
if ($1 eq $tag) { |
415
|
2
|
|
|
|
|
5
|
$part->addUtterance($self->{utterances}{$key}); |
416
|
|
|
|
|
|
|
} |
417
|
|
|
|
|
|
|
} |
418
|
|
|
|
|
|
|
} |
419
|
|
|
|
|
|
|
#return the title citation |
420
|
4
|
|
|
|
|
12
|
return $part; |
421
|
|
|
|
|
|
|
} |
422
|
|
|
|
|
|
|
#----------------------------------------------------------------------- |
423
|
|
|
|
|
|
|
|
424
|
|
|
|
|
|
|
1; |
425
|
|
|
|
|
|
|
|
426
|
|
|
|
|
|
|
__END__ |