Spaces:

seanpedrickcase
/

Light-PDF-Web-QA-Chatbot

Running

Light-PDF-Web-QA-Chatbot / test /test_module.py

Changed embedding model to mixed bread xsmall, optimised related functions in general. Updated Gemini model references.

d3a9db3 3 months ago

1.24 kB

	# ---
	# jupyter:
	# jupytext:
	# formats: ipynb,py:light
	# text_representation:
	# extension: .py
	# format_name: light
	# format_version: '1.5'
	# jupytext_version: 1.15.0
	# kernelspec:
	# display_name: Python 3 (ipykernel)
	# language: python
	# name: python3
	# ---

	# +
	import pytest
	import gradio as gr
	from ..tools.ingest import *
	from ..tools.chatfuncs import *

	def test_read_docx():
	    """Check that ``read_docx`` returns the exact text of the sample Word document."""
	    # NOTE(review): assumes 'sample.docx' is resolvable from the test's
	    # working directory -- confirm where the fixture lives.
	    expected_text = "Hello, World!"
	    extracted_text = read_docx('sample.docx')
	    assert extracted_text == expected_text


	# +
	def test_parse_file():
	    """Check that ``parse_file`` maps each supported sample file to its expected text."""
	    # Assumes these fixture files exist and each one contains the text below.
	    expected_by_path = {
	        'sample.docx': 'Hello, World!',
	        'sample.pdf': 'Hello, World!',
	        'sample.txt': 'Hello, World!',
	        'sample.html': 'Hello, World!',
	    }

	    # parse_file is handed a real list of paths, in the order declared above.
	    parsed = parse_file(list(expected_by_path))

	    for path, expected_text in expected_by_path.items():
	        assert parsed[path] == expected_text

	def test_unsupported_file_type():
	    """Expect an 'Unsupported file type:' message for a file with an unknown extension."""
	    unknown_path = 'sample.unknown'
	    parsed = parse_file([unknown_path])
	    message = parsed[unknown_path]
	    assert message.startswith('Unsupported file type:')

	def test_input_validation():
	    """Expect ``parse_file`` to raise ``ValueError`` when given a bare string, not a list."""
	    # ``match`` is applied as a regular expression, so the trailing period is
	    # escaped to require a literal "." instead of matching any character.
	    with pytest.raises(ValueError, match=r"Expected a list of file paths\."):
	        parse_file('single_file_path.txt')