1
+ from fastapi import FastAPI , UploadFile , File
2
+ from fastapi .responses import JSONResponse
3
+ import uvicorn
4
+ import os
5
+ from groq import Groq
6
+ import PyPDF2
7
+ from pptx import Presentation
8
+ import io
9
+ from PIL import Image
10
+ import tempfile
11
+ import base64
12
+ from mangum import Mangum
13
+
14
# Application and serverless-adapter setup.
app = FastAPI()
handler = Mangum(app)  # AWS Lambda entry point (Mangum wraps the ASGI app)

# Initialize Groq client.
# SECURITY: an API key was previously hard-coded here. A key committed to
# source control is compromised and must be revoked; supply it via the
# GROQ_API_KEY environment variable instead.
client = Groq(
    api_key=os.environ.get("GROQ_API_KEY"),
)
20
+
21
@app.get("/")
async def root():
    """Landing route; confirms the service is up."""
    payload = {"message": "Welcome"}
    return payload
24
+
25
@app.get("/greeting")
async def greeting():
    """Return a static greeting identifying the bot."""
    response = {
        "message": "Hello",
        "details": "You are using LAamAScholar Bot",
    }
    return response
28
+
29
@app.post("/summarize")
async def summarize_file(file: UploadFile = File(...)):
    """Summarize an uploaded PDF or PPTX document.

    Reads the whole upload into memory, extracts its text, and returns
    ``{"summary": ...}``. Any other extension yields a 400 JSON error.
    """
    content = await file.read()

    # Compare extensions case-insensitively so "REPORT.PDF" is accepted;
    # filename may be None for some clients, so default to "".
    filename = (file.filename or "").lower()
    if filename.endswith(".pdf"):
        text = extract_text_from_pdf(content)
    elif filename.endswith(".pptx"):
        text = extract_text_from_pptx(content)
    else:
        return JSONResponse(
            status_code=400,
            content={"error": "Unsupported file format. Please upload a PDF or PPTX file."},
        )

    summary = summarize_text(text)
    return {"summary": summary}
42
+
43
@app.post("/generate_questions")
async def generate_questions(file: UploadFile = File(...)):
    """Generate study questions from an uploaded PDF or PPTX document.

    Reads the whole upload into memory, extracts its text, and returns
    ``{"questions": ...}``. Any other extension yields a 400 JSON error.
    """
    content = await file.read()

    # Compare extensions case-insensitively so "SLIDES.PPTX" is accepted;
    # filename may be None for some clients, so default to "".
    filename = (file.filename or "").lower()
    if filename.endswith(".pdf"):
        text = extract_text_from_pdf(content)
    elif filename.endswith(".pptx"):
        text = extract_text_from_pptx(content)
    else:
        return JSONResponse(
            status_code=400,
            content={"error": "Unsupported file format. Please upload a PDF or PPTX file."},
        )

    questions = generate_important_questions(text)
    return {"questions": questions}
56
+
57
@app.post("/voice-notes")
async def transcribe_voice_notes(file: UploadFile = File(...)):
    """Transcribe an uploaded MP3 voice note via Groq Whisper.

    The upload is spooled to a temporary file (deleted afterwards), sent to
    the ``whisper-large-v3`` model, and the plain transcription text is
    returned as ``{"transcription": ...}``.
    """
    # Case-insensitive extension check so "NOTE.MP3" is accepted;
    # filename may be None for some clients, so default to "".
    if not (file.filename or "").lower().endswith(".mp3"):
        return JSONResponse(
            status_code=400,
            content={"error": "Unsupported file format. Please upload an MP3 file."},
        )

    # Persist the upload to disk: the Groq SDK expects a real file object.
    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as temp_file:
        content = await file.read()
        temp_file.write(content)
        temp_file_path = temp_file.name

    try:
        with open(temp_file_path, "rb") as audio_file:
            transcription = client.audio.transcriptions.create(
                file=(file.filename, audio_file),
                model="whisper-large-v3",
                response_format="verbose_json",
            )

        return {"transcription": transcription.text}
    finally:
        # Always remove the temporary file, even if transcription failed.
        os.unlink(temp_file_path)
80
def encode_image(image_file):
    """Read a binary file-like object fully and return it base64-encoded as str."""
    raw = image_file.read()
    return base64.b64encode(raw).decode("utf-8")
82
+
83
@app.post("/ocr/")
async def perform_ocr(file: UploadFile = File(...)):
    """Run vision-model OCR over an uploaded image.

    The image is base64-embedded in a data URL and sent to Groq's
    llama-3.2 vision model with an educational-explanation prompt; the
    model's reply is returned as ``{"ocr_result": ...}``.
    """
    # Read the upload and base64-encode it for the data-URL payload.
    contents = await file.read()
    base64_image = encode_image(io.BytesIO(contents))

    # Single user turn carrying both the image and the instruction text.
    messages = [
        {
            "role": "user",
            "content": [
                {
                    "type": "image_url",
                    "image_url": {
                        "url": f"data:image/jpeg;base64,{base64_image}",
                    },
                },
                {
                    "type": "text",
                    "text": "Explain what is written in the image from an educational Point of View.",
                },
            ],
        }
    ]

    # Query the vision model; temperature 0 for more deterministic results.
    completion = client.chat.completions.create(
        model="llama-3.2-11b-vision-preview",
        messages=messages,
        temperature=0,
        max_tokens=1024,
        top_p=1,
        stream=False,
        stop=None,
    )

    # First choice carries the OCR explanation.
    ocr_result = completion.choices[0].message.content
    return {"ocr_result": ocr_result}
123
+
124
def extract_text_from_pdf(content):
    """Return the concatenated text of every page of a PDF given as bytes.

    Pages with no extractable text contribute nothing: ``extract_text()``
    can return None (scanned/image-only pages), which would raise a
    TypeError under naive ``+=`` concatenation, so it is coerced to "".
    """
    pdf_reader = PyPDF2.PdfReader(io.BytesIO(content))
    # join() avoids quadratic string concatenation across many pages.
    return "".join(page.extract_text() or "" for page in pdf_reader.pages)
130
+
131
def extract_text_from_pptx(content):
    """Collect the text of every text-bearing shape in a PPTX given as bytes.

    Each shape's text is followed by a newline; shapes without a ``text``
    attribute (pictures, charts, ...) are skipped.
    """
    deck = Presentation(io.BytesIO(content))
    pieces = []
    for slide in deck.slides:
        for shape in slide.shapes:
            if hasattr(shape, "text"):
                pieces.append(shape.text + "\n")
    return "".join(pieces)
139
+
140
def summarize_text(text):
    """Ask the Groq chat model for a summary of *text*.

    The input is truncated to 4000 characters to fit within the model's
    token limit. An ellipsis is appended only when truncation actually
    occurred (previously it was appended unconditionally, misleadingly
    suggesting short inputs had been cut off).
    """
    snippet = text[:4000]
    if len(text) > 4000:
        snippet += "..."
    prompt = f"Summarize the following text:\n\n{snippet}"

    chat_completion = client.chat.completions.create(
        messages=[
            {
                "role": "user",
                "content": prompt,
            }
        ],
        model="llama3-8b-8192",
    )

    return chat_completion.choices[0].message.content
154
def generate_important_questions(text):
    """Ask the Groq chat model for 5 key questions about *text*."""
    # Truncate to 4000 characters to fit within the model's token limit.
    prompt = (
        "Generate 5 important questions based on the following text:\n\n"
        f"{text[:4000]}..."
    )

    response = client.chat.completions.create(
        model="llama3-8b-8192",
        messages=[{"role": "user", "content": prompt}],
    )
    return response.choices[0].message.content
168
+
169
if __name__ == "__main__":
    # Local development entry point; in AWS Lambda, `handler` is used instead.
    uvicorn.run(app, host="0.0.0.0", port=8000)