victor-johnson committed
Commit 4c456b6 · verified · 1 Parent(s): 510de5b

Update app.py

Files changed (1)
  1. app.py +24 -16
app.py CHANGED
@@ -1,28 +1,37 @@
-import os
 from fastapi import FastAPI
 from pydantic import BaseModel
-from transformers import pipeline, AutoTokenizer, AutoModelForCausalLM
-from langchain_community.llms import HuggingFacePipeline
-from langchain import PromptTemplate, LLMChain
+from transformers import (
+    pipeline,
+    AutoTokenizer,
+    AutoModelForCausalLM,
+    GenerationConfig,
+)
+from langchain_huggingface import HuggingFacePipeline
+from langchain_core.prompts import PromptTemplate
+from langchain.chains import LLMChain
 
-# — Model setup (small enough to CPU-serve in a Space) —
+# — Model setup —
 MODEL_ID = "bigcode/starcoder2-3b"
-tokenizer = AutoTokenizer.from_pretrained(MODEL_ID,trust_remote_code=True)
-model = AutoModelForCausalLM.from_pretrained(MODEL_ID,trust_remote_code=True)
+tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
+model = AutoModelForCausalLM.from_pretrained(MODEL_ID, trust_remote_code=True)
 
-# wrap in a HF pipeline and LangChain LLM
-pipe = pipeline(
-    "text-generation",
-    model=model,
-    tokenizer=tokenizer,
+# — Generation config & pipeline (new API) —
+gen_config = GenerationConfig(
     max_new_tokens=64,
     temperature=0.2,
     top_p=0.95,
     do_sample=False,
 )
+pipe = pipeline(
+    "text-generation",
+    model=model,
+    tokenizer=tokenizer,
+    device_map="auto",
+    generation_config=gen_config,
+)
 llm = HuggingFacePipeline(pipeline=pipe)
 
-# define a simple prompt → chain
+# — Prompt & chain —
 prompt = PromptTemplate(
     input_variables=["description"],
     template=(
@@ -33,7 +42,7 @@ prompt = PromptTemplate(
 )
 chain = LLMChain(llm=llm, prompt=prompt)
 
-# FastAPI app
+# — FastAPI app —
 app = FastAPI()
 
 class Req(BaseModel):
@@ -44,7 +53,6 @@ class Res(BaseModel):
 
 @app.post("/generate-emmet", response_model=Res)
 async def generate_emmet(req: Req):
-    raw = chain.run(req.description)
-    # take just the first line after the prompt
+    raw = chain.invoke(req.description)["text"]  # .invoke() replaces deprecated .run(); it returns a dict
     emmet = raw.strip().splitlines()[0]
     return {"emmet": emmet}
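
Note: LLMChain accepts a bare string here because the chain has a single input variable, but .invoke() returns a dict keyed by the chain's input and output variables (here "description" and "text") rather than the bare string the deprecated .run() returned, which is why the handler pulls the completion out of the "text" key before taking its first line.

For reference, a minimal sketch of a client call against the updated endpoint. The requests library, host, and port below are illustrative assumptions, not part of this commit:

import requests  # hypothetical client-side dependency, not used by app.py

resp = requests.post(
    "http://localhost:8000/generate-emmet",  # assumed local uvicorn default; substitute your Space URL
    json={"description": "a nav bar with five links"},  # maps to Req.description
)
resp.raise_for_status()
print(resp.json()["emmet"])  # Res.emmet: first line of the model's completion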