dwb2023 commited on
Commit
e8d9eb9
·
verified ·
1 Parent(s): 2d49246

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +154 -28
app.py CHANGED
@@ -47,6 +47,7 @@ class RelationshipEngine:
47
  self.setup_database()
48
 
49
  def setup_database(self):
 
50
  self.conn.execute('''
51
  CREATE TABLE IF NOT EXISTS events (
52
  id INTEGER PRIMARY KEY,
@@ -56,46 +57,171 @@ class RelationshipEngine:
56
  )
57
  ''')
58
 
 
59
  self.conn.execute('''
60
- CREATE TABLE IF NOT EXISTS relationships (
61
  id INTEGER PRIMARY KEY,
62
- source_event_id INTEGER,
63
- target_event_id INTEGER,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  relationship_type TEXT,
65
  confidence REAL,
66
- FOREIGN KEY (source_event_id) REFERENCES events(id),
67
- FOREIGN KEY (target_event_id) REFERENCES events(id)
 
 
68
  )
69
  ''')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  self.conn.commit()
71
 
72
  def find_related_events(self, event_data):
73
- # Find events with similar entities
74
- cursor = self.conn.execute('''
75
- SELECT * FROM events
76
- WHERE text LIKE ?
77
- ORDER BY timestamp DESC
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  LIMIT 5
79
- ''', (f"%{event_data.get('text', '')}%",))
80
-
81
- related_events = cursor.fetchall()
82
- return related_events
 
 
 
 
 
 
 
 
 
 
 
 
 
 
83
 
84
- def calculate_relationship_confidence(self, event1, event2):
85
- # Simple similarity-based confidence
86
- base_confidence = 0.0
 
 
 
 
 
 
 
87
 
88
- # Entity overlap increases confidence
89
- if set(event1.get('entities', {}).get('people', [])) & set(event2.get('entities', {}).get('people', [])):
90
- base_confidence += 0.3
91
-
92
- if set(event1.get('entities', {}).get('organizations', [])) & set(event2.get('entities', {}).get('organizations', [])):
93
- base_confidence += 0.3
94
-
95
- if set(event1.get('entities', {}).get('locations', [])) & set(event2.get('entities', {}).get('locations', [])):
96
- base_confidence += 0.4
97
-
98
- return min(base_confidence, 1.0)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
 
100
  class EventAnalyzer:
101
  def __init__(self):
 
47
  self.setup_database()
48
 
49
  def setup_database(self):
50
+ # Events table
51
  self.conn.execute('''
52
  CREATE TABLE IF NOT EXISTS events (
53
  id INTEGER PRIMARY KEY,
 
57
  )
58
  ''')
59
 
60
+ # Entities table
61
  self.conn.execute('''
62
+ CREATE TABLE IF NOT EXISTS entities (
63
  id INTEGER PRIMARY KEY,
64
+ entity_text TEXT,
65
+ entity_type TEXT, -- person, organization, location, hashtag, temporal
66
+ first_seen DATETIME,
67
+ last_seen DATETIME,
68
+ frequency INTEGER DEFAULT 1,
69
+ confidence REAL
70
+ )
71
+ ''')
72
+
73
+ # Event-Entity relationships
74
+ self.conn.execute('''
75
+ CREATE TABLE IF NOT EXISTS event_entities (
76
+ event_id INTEGER,
77
+ entity_id INTEGER,
78
+ FOREIGN KEY (event_id) REFERENCES events(id),
79
+ FOREIGN KEY (entity_id) REFERENCES entities(id),
80
+ PRIMARY KEY (event_id, entity_id)
81
+ )
82
+ ''')
83
+
84
+ # Entity relationships (e.g., person-organization affiliations)
85
+ self.conn.execute('''
86
+ CREATE TABLE IF NOT EXISTS entity_relationships (
87
+ id INTEGER PRIMARY KEY,
88
+ source_entity_id INTEGER,
89
+ target_entity_id INTEGER,
90
  relationship_type TEXT,
91
  confidence REAL,
92
+ first_seen DATETIME,
93
+ last_seen DATETIME,
94
+ FOREIGN KEY (source_entity_id) REFERENCES entities(id),
95
+ FOREIGN KEY (target_entity_id) REFERENCES entities(id)
96
  )
97
  ''')
98
+
99
+ self.conn.commit()
100
+
101
+ def store_entities(self, event_id, entities_dict):
102
+ now = datetime.now().isoformat()
103
+
104
+ for entity_type, entities in entities_dict.items():
105
+ if not isinstance(entities, list):
106
+ continue
107
+
108
+ for entity_text in entities:
109
+ # Check if entity exists
110
+ cursor = self.conn.execute(
111
+ 'SELECT id, frequency FROM entities WHERE entity_text = ? AND entity_type = ?',
112
+ (entity_text, entity_type)
113
+ )
114
+ result = cursor.fetchone()
115
+
116
+ if result:
117
+ # Update existing entity
118
+ entity_id, freq = result
119
+ self.conn.execute('''
120
+ UPDATE entities
121
+ SET frequency = ?, last_seen = ?
122
+ WHERE id = ?
123
+ ''', (freq + 1, now, entity_id))
124
+ else:
125
+ # Insert new entity
126
+ cursor = self.conn.execute('''
127
+ INSERT INTO entities (entity_text, entity_type, first_seen, last_seen, confidence)
128
+ VALUES (?, ?, ?, ?, ?)
129
+ ''', (entity_text, entity_type, now, now, 1.0))
130
+ entity_id = cursor.lastrowid
131
+
132
+ # Create event-entity relationship
133
+ self.conn.execute('''
134
+ INSERT OR IGNORE INTO event_entities (event_id, entity_id)
135
+ VALUES (?, ?)
136
+ ''', (event_id, entity_id))
137
+
138
  self.conn.commit()
139
 
140
  def find_related_events(self, event_data):
141
+ # Find events sharing entities
142
+ entity_texts = []
143
+ for entity_type, entities in event_data.get('entities', {}).items():
144
+ if isinstance(entities, list):
145
+ entity_texts.extend(entities)
146
+
147
+ if not entity_texts:
148
+ return []
149
+
150
+ # Build query using entity relationships
151
+ query = '''
152
+ SELECT DISTINCT e.*, COUNT(ee.entity_id) as shared_entities
153
+ FROM events e
154
+ JOIN event_entities ee ON e.id = ee.event_id
155
+ JOIN entities ent ON ee.entity_id = ent.id
156
+ WHERE ent.entity_text IN ({})
157
+ GROUP BY e.id
158
+ ORDER BY shared_entities DESC, e.timestamp DESC
159
  LIMIT 5
160
+ '''.format(','.join('?' * len(entity_texts)))
161
+
162
+ cursor = self.conn.execute(query, entity_texts)
163
+ return cursor.fetchall()
164
+
165
+ def find_entity_relationships(self, entity_id):
166
+ # Find direct relationships
167
+ query = '''
168
+ SELECT er.*,
169
+ e1.entity_text as source_text, e1.entity_type as source_type,
170
+ e2.entity_text as target_text, e2.entity_type as target_type
171
+ FROM entity_relationships er
172
+ JOIN entities e1 ON er.source_entity_id = e1.id
173
+ JOIN entities e2 ON er.target_entity_id = e2.id
174
+ WHERE er.source_entity_id = ? OR er.target_entity_id = ?
175
+ '''
176
+ cursor = self.conn.execute(query, (entity_id, entity_id))
177
+ return cursor.fetchall()
178
 
179
+ def update_entity_relationships(self, event_id):
180
+ # Find all entities in the event
181
+ query = '''
182
+ SELECT e.id, e.entity_text, e.entity_type
183
+ FROM entities e
184
+ JOIN event_entities ee ON e.id = ee.entity_id
185
+ WHERE ee.event_id = ?
186
+ '''
187
+ cursor = self.conn.execute(query, (event_id,))
188
+ entities = cursor.fetchall()
189
 
190
+ now = datetime.now().isoformat()
191
+
192
+ # Create/update relationships between entities in same event
193
+ for i, entity1 in enumerate(entities):
194
+ for entity2 in entities[i+1:]:
195
+ # Skip same entity type relationships
196
+ if entity1[2] == entity2[2]:
197
+ continue
198
+
199
+ relationship_type = f"{entity1[2]}_to_{entity2[2]}"
200
+
201
+ # Check if relationship exists
202
+ cursor = self.conn.execute('''
203
+ SELECT id FROM entity_relationships
204
+ WHERE (source_entity_id = ? AND target_entity_id = ?)
205
+ OR (source_entity_id = ? AND target_entity_id = ?)
206
+ ''', (entity1[0], entity2[0], entity2[0], entity1[0]))
207
+
208
+ result = cursor.fetchone()
209
+ if result:
210
+ # Update existing relationship
211
+ self.conn.execute('''
212
+ UPDATE entity_relationships
213
+ SET last_seen = ?, confidence = confidence + 0.1
214
+ WHERE id = ?
215
+ ''', (now, result[0]))
216
+ else:
217
+ # Create new relationship
218
+ self.conn.execute('''
219
+ INSERT INTO entity_relationships
220
+ (source_entity_id, target_entity_id, relationship_type, confidence, first_seen, last_seen)
221
+ VALUES (?, ?, ?, ?, ?, ?)
222
+ ''', (entity1[0], entity2[0], relationship_type, 0.5, now, now))
223
+
224
+ self.conn.commit()
225
 
226
  class EventAnalyzer:
227
  def __init__(self):