David Hrachovy commited on
Commit
9135c43
·
1 Parent(s): 82a0223
Files changed (3) hide show
  1. app.py +7 -7
  2. estate.db +2 -2
  3. init_db.py +3 -6
app.py CHANGED
@@ -12,7 +12,7 @@ from langchain_community.agent_toolkits.sql.toolkit import SQLDatabaseToolkit
12
  from langchain_openai import ChatOpenAI
13
 
14
  # Local imports
15
- from init_db import db_description, Project
16
 
17
  # Load environment variables
18
  load_dotenv()
@@ -24,7 +24,7 @@ if not os.path.exists('estate.db'):
24
  )
25
 
26
  # Initialize model and database
27
- model = ChatOpenAI(model="gpt-4o-2024-08-06", streaming=True)
28
  db = SQLDatabase.from_uri("sqlite:///estate.db")
29
 
30
  # Set up SQL toolkit and tools
@@ -51,7 +51,7 @@ LIMIT 5;
51
 
52
  # Get the OpenAI tools agent prompt
53
  prompt = ChatPromptTemplate.from_messages([
54
- ("system", "You are a helpful assistant. You speak Czech. You can answer questions about real estate projects (novostavby) in Czech Republic. You have access to a database of real estate projects (translate output to Czech too). Some info about the structure of the database: " + db_description + "Note that some json values can be null so you must sometimes so make sure to add IS NOT NULL when appropriate. Always query projects with structure->'$.ignore'=false or NULL. For calculating you can adapt this query: " + sql_distance_query),
55
  ("placeholder", "{chat_history}"),
56
  ("human", "{input}"),
57
  ("placeholder", "{agent_scratchpad}"),
@@ -91,11 +91,11 @@ count_projects = Project.select().where(Project.structure.is_null(False)).count(
91
  demo = gr.ChatInterface(
92
  fn=chat_with_sql,
93
  title="Estate Chat",
94
- description=f"Plánuješ koupit novostavbu? Zeptej se na {count_projects} novostaveb v ČR 🇨🇿",
95
  examples=[
96
- "Projekt s nejnižším vkladem",
97
- "Nejlevnější byt v Praze",
98
- "Nejmenší m2 v Praze"
99
  ],
100
  type="messages"
101
  )
 
12
  from langchain_openai import ChatOpenAI
13
 
14
  # Local imports
15
+ from init_db import Project, db_description, json_structure
16
 
17
  # Load environment variables
18
  load_dotenv()
 
24
  )
25
 
26
  # Initialize model and database
27
+ model = ChatOpenAI(model="o3-mini-2025-01-31", streaming=True)
28
  db = SQLDatabase.from_uri("sqlite:///estate.db")
29
 
30
  # Set up SQL toolkit and tools
 
51
 
52
  # Get the OpenAI tools agent prompt
53
  prompt = ChatPromptTemplate.from_messages([
54
+ ("system", f"You are a helpful assistant that presents information about real estate projects in database for investors. Before executing queries make surey youhave schema of dabatase and first rows. This JSON structure info can help you: {json_structure}."),
55
  ("placeholder", "{chat_history}"),
56
  ("human", "{input}"),
57
  ("placeholder", "{agent_scratchpad}"),
 
91
  demo = gr.ChatInterface(
92
  fn=chat_with_sql,
93
  title="Estate Chat",
94
+ description=f"Planning to buy a new apartment? Ask me about {count_projects} new buildings (novostavby) in Prague 🇨🇿",
95
  examples=[
96
+ "Project with the lowest deposit before completion",
97
+ "Cheapest apartment in Prague",
98
+ "Best price per sqm in Prague"
99
  ],
100
  type="messages"
101
  )
estate.db CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17722ed41be0a8aeb7fd4a4598bee19c04b4c6d0eb745b172263f9f3ca53bb48
3
- size 2527232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb20aad2ca84e0866daaf3888ddcc304f123dc9671afdd45adc2fa2e0a2036c9
3
+ size 2560000
init_db.py CHANGED
@@ -4,17 +4,14 @@ from playhouse.sqlite_ext import *
4
 
5
  # Initialize database
6
 
7
- json_structure = "JSON column with hash with keys 'title': str, official title of the project, 'deposit': int, initial deposit (in percentage) for apartments or null if unknown, 'min_price': int, lowest available apartment price with VAT. It should not be booked or sold., 'average_price_per_sqm': int, average price per square meter of the lowest available apartment. If they sell house and not apartment, calculate only from the apartment size, not size of garden (land), 'status': str, status of the project (preparation, selling, sold out), 'city': str, city of the project, 'lat': float, gps coordinates of the project, 'lng': float, gps coordinates of the project, 'start_year': int, year of construction start, 'end_year': int, estimated year of construction end, 'developer': str, name of the contruction company/developer, 'ignore': bool, if True, the project does not have any apartments for sale, Some values can be null/unknown"
8
 
9
- db = SqliteExtDatabase('estate.db', pragmas=(
10
- ('cache_size', -1024 * 64), # 64MB page-cache.
11
- ('journal_mode', 'wal'), # Use WAL-mode (you should always use this!).
12
- ('foreign_keys', 1))) # Enforce foreign-key constraints.
13
 
14
  db_description = f"""Table "project" - list of real estate projects (novostavby) in Czech Republic
15
  url: url of the project.
16
  structure: {json_structure}.
17
- content: contents of the website, information about the project.
18
  created_at: date and time of creation.
19
  """
20
 
 
4
 
5
  # Initialize database
6
 
7
+ json_structure = "JSON column with hash with keys 'title': str, official title of the project, 'deposit': int (in percentage), sum of all deposit payments before the apartment is complete. 'min_price': int, lowest available apartment price in CZK with VAT. It should not be booked or sold., 'average_price_per_sqm': int, average price per square meter of the lowest available apartment. 'status': str, status of the project (preparation, selling, sold out), 'city': str, city of the project, 'lat': float, gps coordinates of the project, 'lng': float, gps coordinates of the project, 'start_year': int, year of construction start, 'end_year': int, estimated year of construction end, 'developer': str, name of the contruction company/developer, 'ignore': bool, if True, the project does not have any apartments for sale. Some values can be null/unknown"
8
 
9
+ db = SqliteExtDatabase('estate.db')
 
 
 
10
 
11
  db_description = f"""Table "project" - list of real estate projects (novostavby) in Czech Republic
12
  url: url of the project.
13
  structure: {json_structure}.
14
+ content: unstructured additional information about the project.
15
  created_at: date and time of creation.
16
  """
17