Adopt FAISS as a GPU-only dense retrieval backend for benchmark runs, while preserving current Qdrant behavior as a fallback and avoiding faiss-cpu installation in shared environments.
- In scope:
- GPU-only FAISS dependency path.
- Backend selection via config/env.
- Dense retrieval migration (coarse + rerank path).
- Benchmark parity checks (latency + retrieval quality).
- Out of scope:
- Removing Qdrant immediately.
- ANN index tuning (IVF/HNSW/PQ) in phase 1.
- Dense indexing and retrieval are Qdrant-based in storage/indexer.py and retrieval/retriever.py.
- BM25 stays in storage/indexer.py and retrieval/retriever.py.
- Cluster routing currently uses MiniBatchKMeans in storage/indexer.py.
- GPU image path is Dockerfile.gpu.
- Bare-metal GPU setup path is Makefile.
- Do not add FAISS to requirements.txt.
- Install FAISS only in GPU-specific setup paths:
- Add a `VECTOR_BACKEND` switch: `qdrant` (default) or `faiss` (GPU benchmark path).
- Keep BM25 unchanged for hybrid retrieval.
- Start with exact FAISS indexes:
- `IndexFlatIP(128)` for the coarse stage.
- `IndexFlatIP(384)` for full-stage rerank/scoring.
- Reassess cluster routing after FAISS benchmark data; keep initially for parity.
- Add backend config in config.py: `VECTOR_BACKEND = os.getenv("VECTOR_BACKEND", "qdrant")`
- Add FAISS install in Dockerfile.gpu only.
- Add FAISS install in the Makefile `setup` target only.
- Add GPU benchmark targets in the Makefile: `bench-faiss` and `e2e-faiss`.
- Export `VECTOR_BACKEND=faiss` for these targets.
- Introduce FAISS index build functions in storage/indexer.py:
- build coarse and full indexes from normalized vectors.
- Persist artifacts under `data/`:
- `coarse.faiss`
- `full.faiss` (optional if rerank is numpy-only over candidate vectors)
- metadata map (row_id -> chunk metadata)
- Keep existing BM25 and chunk cache unchanged.
- In retrieval/retriever.py, route `_coarse_search` by backend:
- Qdrant path (existing)
- FAISS path (new)
- In retrieval/retriever.py, route `_rerank` by backend:
- Qdrant path (existing)
- FAISS/numpy candidate scoring path (new)
- Keep query embedding and BM25 flow unchanged in retrieval/retriever.py.
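The numpy candidate-scoring path mentioned above could look like this sketch (the function name and signature are assumptions, and vectors are assumed L2-normalized so a dot product gives cosine similarity):

```python
import numpy as np

def rerank_candidates(query_full: np.ndarray,
                      candidate_ids: list,
                      full_vecs: np.ndarray,
                      top_k: int = 10):
    """Exact inner-product rerank of coarse candidates; no second FAISS index needed."""
    cand = full_vecs[candidate_ids]   # (n_candidates, 384)
    scores = cand @ query_full        # cosine similarity for unit vectors
    order = np.argsort(-scores)[:top_k]
    return [(candidate_ids[i], float(scores[i])) for i in order]
```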
- Compare `qdrant` vs `faiss` on the same corpus/questions:
- ingestion index build time
- query latency for all 15 questions
- top-k overlap and final answer quality metrics
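For the top-k overlap check, a simple helper such as the following could be used (purely illustrative; the name is not from the codebase):

```python
def topk_overlap(ids_a, ids_b, k: int = 10) -> float:
    """Fraction of top-k result ids shared between two backends' result lists."""
    return len(set(ids_a[:k]) & set(ids_b[:k])) / k
```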
- Acceptance criteria:
- FAISS backend installs only in GPU paths.
- No `faiss-cpu` anywhere.
- FAISS benchmark latency is equal to or better than Qdrant's.
- No quality regression beyond agreed threshold.
- If FAISS wins, make `faiss` the default only in GPU benchmark workflows.
- FAISS wheel/CUDA compatibility:
- Pin versions and validate in both Docker and bare-metal setup.
- Divergence between Docker and Makefile setups:
- Use same install source/version in both files.
- Metadata mapping bugs:
- Add integrity checks for row_id/chunk_id consistency.
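One possible integrity check for the metadata map (a hypothetical helper, not existing code): every FAISS row id must map to exactly one metadata entry, with ids dense from 0 to ntotal - 1.

```python
def check_row_map(ntotal: int, row_map: dict) -> None:
    """Raise if the row_id -> metadata map does not cover FAISS rows 0..ntotal-1."""
    ids = sorted(int(k) for k in row_map)
    if ids != list(range(ntotal)):
        raise ValueError(
            f"row map has {len(ids)} entries for an index with {ntotal} rows"
        )
```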
- Cluster routing complexity:
- Keep behind flag, disable if no measurable gain.
- M1 (0.5 day): dependency plumbing + backend flag.
- M2 (1 day): FAISS indexing + persistence.
- M3 (1 day): retrieval integration + parity tests.
- M4 (0.5 day): benchmark report + decision.
- GPU-only FAISS path operational in Dockerfile.gpu and Makefile.
- `VECTOR_BACKEND=faiss` runs ingestion and query successfully.
- Benchmarks documented with a Qdrant comparison.
- Default non-GPU/local paths remain unaffected.