Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -47,6 +47,7 @@ class RelationshipEngine:
|
|
47 |
self.setup_database()
|
48 |
|
49 |
def setup_database(self):
|
|
|
50 |
self.conn.execute('''
|
51 |
CREATE TABLE IF NOT EXISTS events (
|
52 |
id INTEGER PRIMARY KEY,
|
@@ -56,46 +57,171 @@ class RelationshipEngine:
|
|
56 |
)
|
57 |
''')
|
58 |
|
|
|
59 |
self.conn.execute('''
|
60 |
-
CREATE TABLE IF NOT EXISTS
|
61 |
id INTEGER PRIMARY KEY,
|
62 |
-
|
63 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
64 |
relationship_type TEXT,
|
65 |
confidence REAL,
|
66 |
-
|
67 |
-
|
|
|
|
|
68 |
)
|
69 |
''')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
70 |
self.conn.commit()
|
71 |
|
72 |
def find_related_events(self, event_data):
|
73 |
-
# Find events
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
LIMIT 5
|
79 |
-
''',
|
80 |
-
|
81 |
-
|
82 |
-
return
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
83 |
|
84 |
-
def
|
85 |
-
#
|
86 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
99 |
|
100 |
class EventAnalyzer:
|
101 |
def __init__(self):
|
|
|
47 |
self.setup_database()
|
48 |
|
49 |
def setup_database(self):
|
50 |
+
# Events table
|
51 |
self.conn.execute('''
|
52 |
CREATE TABLE IF NOT EXISTS events (
|
53 |
id INTEGER PRIMARY KEY,
|
|
|
57 |
)
|
58 |
''')
|
59 |
|
60 |
+
# Entities table
|
61 |
self.conn.execute('''
|
62 |
+
CREATE TABLE IF NOT EXISTS entities (
|
63 |
id INTEGER PRIMARY KEY,
|
64 |
+
entity_text TEXT,
|
65 |
+
entity_type TEXT, -- person, organization, location, hashtag, temporal
|
66 |
+
first_seen DATETIME,
|
67 |
+
last_seen DATETIME,
|
68 |
+
frequency INTEGER DEFAULT 1,
|
69 |
+
confidence REAL
|
70 |
+
)
|
71 |
+
''')
|
72 |
+
|
73 |
+
# Event-Entity relationships
|
74 |
+
self.conn.execute('''
|
75 |
+
CREATE TABLE IF NOT EXISTS event_entities (
|
76 |
+
event_id INTEGER,
|
77 |
+
entity_id INTEGER,
|
78 |
+
FOREIGN KEY (event_id) REFERENCES events(id),
|
79 |
+
FOREIGN KEY (entity_id) REFERENCES entities(id),
|
80 |
+
PRIMARY KEY (event_id, entity_id)
|
81 |
+
)
|
82 |
+
''')
|
83 |
+
|
84 |
+
# Entity relationships (e.g., person-organization affiliations)
|
85 |
+
self.conn.execute('''
|
86 |
+
CREATE TABLE IF NOT EXISTS entity_relationships (
|
87 |
+
id INTEGER PRIMARY KEY,
|
88 |
+
source_entity_id INTEGER,
|
89 |
+
target_entity_id INTEGER,
|
90 |
relationship_type TEXT,
|
91 |
confidence REAL,
|
92 |
+
first_seen DATETIME,
|
93 |
+
last_seen DATETIME,
|
94 |
+
FOREIGN KEY (source_entity_id) REFERENCES entities(id),
|
95 |
+
FOREIGN KEY (target_entity_id) REFERENCES entities(id)
|
96 |
)
|
97 |
''')
|
98 |
+
|
99 |
+
self.conn.commit()
|
100 |
+
|
101 |
+
def store_entities(self, event_id, entities_dict):
|
102 |
+
now = datetime.now().isoformat()
|
103 |
+
|
104 |
+
for entity_type, entities in entities_dict.items():
|
105 |
+
if not isinstance(entities, list):
|
106 |
+
continue
|
107 |
+
|
108 |
+
for entity_text in entities:
|
109 |
+
# Check if entity exists
|
110 |
+
cursor = self.conn.execute(
|
111 |
+
'SELECT id, frequency FROM entities WHERE entity_text = ? AND entity_type = ?',
|
112 |
+
(entity_text, entity_type)
|
113 |
+
)
|
114 |
+
result = cursor.fetchone()
|
115 |
+
|
116 |
+
if result:
|
117 |
+
# Update existing entity
|
118 |
+
entity_id, freq = result
|
119 |
+
self.conn.execute('''
|
120 |
+
UPDATE entities
|
121 |
+
SET frequency = ?, last_seen = ?
|
122 |
+
WHERE id = ?
|
123 |
+
''', (freq + 1, now, entity_id))
|
124 |
+
else:
|
125 |
+
# Insert new entity
|
126 |
+
cursor = self.conn.execute('''
|
127 |
+
INSERT INTO entities (entity_text, entity_type, first_seen, last_seen, confidence)
|
128 |
+
VALUES (?, ?, ?, ?, ?)
|
129 |
+
''', (entity_text, entity_type, now, now, 1.0))
|
130 |
+
entity_id = cursor.lastrowid
|
131 |
+
|
132 |
+
# Create event-entity relationship
|
133 |
+
self.conn.execute('''
|
134 |
+
INSERT OR IGNORE INTO event_entities (event_id, entity_id)
|
135 |
+
VALUES (?, ?)
|
136 |
+
''', (event_id, entity_id))
|
137 |
+
|
138 |
self.conn.commit()
|
139 |
|
140 |
def find_related_events(self, event_data):
|
141 |
+
# Find events sharing entities
|
142 |
+
entity_texts = []
|
143 |
+
for entity_type, entities in event_data.get('entities', {}).items():
|
144 |
+
if isinstance(entities, list):
|
145 |
+
entity_texts.extend(entities)
|
146 |
+
|
147 |
+
if not entity_texts:
|
148 |
+
return []
|
149 |
+
|
150 |
+
# Build query using entity relationships
|
151 |
+
query = '''
|
152 |
+
SELECT DISTINCT e.*, COUNT(ee.entity_id) as shared_entities
|
153 |
+
FROM events e
|
154 |
+
JOIN event_entities ee ON e.id = ee.event_id
|
155 |
+
JOIN entities ent ON ee.entity_id = ent.id
|
156 |
+
WHERE ent.entity_text IN ({})
|
157 |
+
GROUP BY e.id
|
158 |
+
ORDER BY shared_entities DESC, e.timestamp DESC
|
159 |
LIMIT 5
|
160 |
+
'''.format(','.join('?' * len(entity_texts)))
|
161 |
+
|
162 |
+
cursor = self.conn.execute(query, entity_texts)
|
163 |
+
return cursor.fetchall()
|
164 |
+
|
165 |
+
def find_entity_relationships(self, entity_id):
|
166 |
+
# Find direct relationships
|
167 |
+
query = '''
|
168 |
+
SELECT er.*,
|
169 |
+
e1.entity_text as source_text, e1.entity_type as source_type,
|
170 |
+
e2.entity_text as target_text, e2.entity_type as target_type
|
171 |
+
FROM entity_relationships er
|
172 |
+
JOIN entities e1 ON er.source_entity_id = e1.id
|
173 |
+
JOIN entities e2 ON er.target_entity_id = e2.id
|
174 |
+
WHERE er.source_entity_id = ? OR er.target_entity_id = ?
|
175 |
+
'''
|
176 |
+
cursor = self.conn.execute(query, (entity_id, entity_id))
|
177 |
+
return cursor.fetchall()
|
178 |
|
179 |
+
def update_entity_relationships(self, event_id):
|
180 |
+
# Find all entities in the event
|
181 |
+
query = '''
|
182 |
+
SELECT e.id, e.entity_text, e.entity_type
|
183 |
+
FROM entities e
|
184 |
+
JOIN event_entities ee ON e.id = ee.entity_id
|
185 |
+
WHERE ee.event_id = ?
|
186 |
+
'''
|
187 |
+
cursor = self.conn.execute(query, (event_id,))
|
188 |
+
entities = cursor.fetchall()
|
189 |
|
190 |
+
now = datetime.now().isoformat()
|
191 |
+
|
192 |
+
# Create/update relationships between entities in same event
|
193 |
+
for i, entity1 in enumerate(entities):
|
194 |
+
for entity2 in entities[i+1:]:
|
195 |
+
# Skip same entity type relationships
|
196 |
+
if entity1[2] == entity2[2]:
|
197 |
+
continue
|
198 |
+
|
199 |
+
relationship_type = f"{entity1[2]}_to_{entity2[2]}"
|
200 |
+
|
201 |
+
# Check if relationship exists
|
202 |
+
cursor = self.conn.execute('''
|
203 |
+
SELECT id FROM entity_relationships
|
204 |
+
WHERE (source_entity_id = ? AND target_entity_id = ?)
|
205 |
+
OR (source_entity_id = ? AND target_entity_id = ?)
|
206 |
+
''', (entity1[0], entity2[0], entity2[0], entity1[0]))
|
207 |
+
|
208 |
+
result = cursor.fetchone()
|
209 |
+
if result:
|
210 |
+
# Update existing relationship
|
211 |
+
self.conn.execute('''
|
212 |
+
UPDATE entity_relationships
|
213 |
+
SET last_seen = ?, confidence = confidence + 0.1
|
214 |
+
WHERE id = ?
|
215 |
+
''', (now, result[0]))
|
216 |
+
else:
|
217 |
+
# Create new relationship
|
218 |
+
self.conn.execute('''
|
219 |
+
INSERT INTO entity_relationships
|
220 |
+
(source_entity_id, target_entity_id, relationship_type, confidence, first_seen, last_seen)
|
221 |
+
VALUES (?, ?, ?, ?, ?, ?)
|
222 |
+
''', (entity1[0], entity2[0], relationship_type, 0.5, now, now))
|
223 |
+
|
224 |
+
self.conn.commit()
|
225 |
|
226 |
class EventAnalyzer:
|
227 |
def __init__(self):
|