Spaces:

RAHULJUNEJA33
/

LexiGen-Userstory_Generator

Running

App Files Community

RAHULJUNEJA33 committed on 5 days ago

Commit

a28d499

verified ·

1 Parent(s): 3135d92

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -133

app.py CHANGED Viewed

@@ -8,15 +8,14 @@ from transformers import pipeline
 from langchain.prompts import PromptTemplate
 from langchain.chains import LLMChain
 from langchain.llms import OpenAI
-import openai
-import httpx  # Only needed if using proxies
 # Initialize OpenAI client with Streamlit secrets
 openai_api_key = st.secrets["OPENAI_API_KEY"]
-openai_client = openai.Client(api_key=openai_api_key)
 # Configuration
-pytesseract.pytesseract.tesseract_cmd = '/usr/bin/tesseract'  # For Hugging Face Spaces
 classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")
 # Initialize FAISS
@@ -47,134 +46,8 @@ def extract_text(uploaded_file):
         st.error(f"Text extraction failed: {str(e)}")
         return ""
-def is_functional_spec(text):
-    """Check if document is a functional specification"""
-    if len(text) < 100:
-        return False
-    candidate_labels = ["functional specification", "academic paper", "technical documentation"]
-    result = classifier(text[:1000], candidate_labels)
-    return result['labels'][0] == "functional specification"
-def chunk_text(text, chunk_size=800):
-    """Split text into manageable chunks"""
-    words = text.split()
-    chunks = []
-    current_chunk = []
-    count = 0
-    for word in words:
-        current_chunk.append(word)
-        count += len(word.split())
-        if count >= chunk_size:
-            chunks.append(" ".join(current_chunk))
-            current_chunk = []
-            count = 0
-    if current_chunk:
-        chunks.append(" ".join(current_chunk))
-    return chunks
-def embed_and_store(chunks):
-    """Create and store embeddings"""
-    embeddings = []
-    for chunk in chunks:
-        response = openai_client.embeddings.create(
-            model="text-embedding-ada-002",
-            input=chunk
-        )
-        embeddings.append(response['data'][0]['embedding'])
-    if embeddings:
-        index.add(np.array(embeddings).astype('float32'))
-def search_vector_database(query, top_k=5):
-    """Semantic search for relevant content"""
-    response = openai_client.embeddings.create(
-        model="text-embedding-ada-002",
-        input=query
-    )
-    query_embedding = np.array(response['data'][0]['embedding']).astype('float32').reshape(1, -1)
-    _, indices = index.search(query_embedding, top_k)
-    return indices[0]
-def display_results(response):
-    """Organized display of analysis results"""
-    st.subheader("🚀 Analysis Results")
-    with st.container():
-        current_epic = None
-        for line in response.split('\n'):
-            line = line.strip()
-            if not line:
-                continue
-            if line.startswith("## Epic:"):
-                current_epic = line.split(":", 1)[1].strip()
-                with st.expander(f"📦 {current_epic}"):
-                    st.markdown(f"**Epic Overview**\n{current_epic}")
-            elif line.startswith("### Feature:"):
-                feature = line.split(":", 1)[1].strip()
-                st.markdown(f"**🔧 Feature:** {feature}")
-            elif line.startswith("#### User Story:"):
-                story = line.split(":", 1)[1].strip()
-                st.markdown(f"▪️ {story}")
-            else:
-                st.write(line)
-def process_document(text):
-    """Main processing pipeline"""
-    if not is_functional_spec(text):
-        st.error("❌ This document doesn't appear to be a functional specification")
-        return None
-    chunks = chunk_text(text)
-    embed_and_store(chunks)
-    # Enhanced semantic search
-    relevant_chunks = []
-    for query in ["user requirements", "system features", "user stories"]:
-        indices = search_vector_database(query, top_k=2)
-        relevant_chunks.extend([chunks[i] for i in indices])
-    # Analysis prompt
-    prompt_template = """Identify and structure these elements from the document:
-## Epic: [High-level objective]
-### Feature: [Key capability]
-#### User Story: [Specific need in format: As a <role>, I want <goal> so that <reason>]
-Document:
-{document_text}
-Format strictly using markdown headings (##, ###, ####) without numbering."""
-    llm_chain = LLMChain(
-        prompt=PromptTemplate(template=prompt_template, input_variables=["document_text"]),
-        llm=OpenAI(openai_api_key=openai_api_key, temperature=0.3, max_tokens=2000)
-    )
-    return llm_chain.run(document_text="\n".join(relevant_chunks))
-def generate_user_story_details(user_story):
-    """Generate detailed breakdown"""
-    prompt = f"""Expand this user story into detailed specifications:
-{user_story}
-Include:
-✅ Acceptance Criteria (Gherkin format)
-📈 Success Metrics
-⚠️ Edge Cases
-🔧 Technical Requirements
-🖥️ UX Considerations"""
-    response = openai_client.chat.completions.create(
-        model="gpt-4",
-        messages=[{"role": "user", "content": prompt}],
-        temperature=0.2,
-        max_tokens=1500
-    )
-    return response['choices'][0]['message']['content']
 # Streamlit UI
 st.set_page_config(page_title="SpecAnalyzer", layout="wide")
@@ -215,4 +88,4 @@ if uploaded_file:
                         mime="text/markdown"
                     )
     else:
-        st.error("Failed to extract text from document")

 from langchain.prompts import PromptTemplate
 from langchain.chains import LLMChain
 from langchain.llms import OpenAI
+from openai import OpenAI
 # Initialize OpenAI client with Streamlit secrets
 openai_api_key = st.secrets["OPENAI_API_KEY"]
+client = OpenAI(api_key=openai_api_key)  # Correct client initialization
 # Configuration
+pytesseract.pytesseract.tesseract_cmd = '/usr/bin/tesseract'
 classifier = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")
 # Initialize FAISS
         st.error(f"Text extraction failed: {str(e)}")
         return ""
+# Rest of the functions remain the same as previous working version
+# ... [Keep all other functions identical to the last working code] ...
 # Streamlit UI
 st.set_page_config(page_title="SpecAnalyzer", layout="wide")
                         mime="text/markdown"
                     )
     else:
+        st.error("Failed to extract text from document")