Code development platform for open source projects from the European Union institutions

Skip to content
Snippets Groups Projects
Commit 54ede653 authored by nasredine's avatar nasredine
Browse files

preliminary results of prompt engineering

parents
No related branches found
No related tags found
No related merge requests found
.env
myenv/*
data/*
akn4eu_generation_open_llms.ipynb
import requests
import json
import time
import os
def call_api(input_text, token, model_name, max_new_tokens):
    """Send an inference request to the DeepInfra API and time it.

    Args:
        input_text: Prompt text sent as the model input.
        token: DeepInfra API bearer token.
        model_name: Model identifier, e.g. "mistralai/Mixtral-8x7B-Instruct-v0.1".
        max_new_tokens: Maximum number of tokens the model may generate.

    Returns:
        Tuple of (parsed JSON response, wall-clock execution time in seconds).
    """
    start_time = time.time()  # Capture start time
    url = f"https://api.deepinfra.com/v1/inference/{model_name}"
    headers = {
        "Content-Type": "application/json",
        "Authorization": f"Bearer {token}",
    }
    data = {
        "input": input_text,
        "max_new_tokens": max_new_tokens,
    }
    # json= serializes the payload for us (the original hand-rolled
    # json.dumps); a timeout keeps the script from hanging forever on a
    # dead connection, which the original could do.
    response = requests.post(url, headers=headers, json=data, timeout=300)
    execution_time = time.time() - start_time  # Elapsed wall-clock seconds
    return response.json(), execution_time
def save_result_to_file(model_name, result, execution_time, base_path='data/responses'):
    """Persist an API result plus its timing as JSON.

    Writes to <base_path>/<model name with '/' replaced by '_'>.json.
    The original wrote into the current working directory, but
    extract_and_save_xml reads from 'data/responses' — so saved results
    were never found.  Defaulting base_path to 'data/responses' fixes the
    round trip; callers may still override it.

    Args:
        model_name: Model identifier; slashes are replaced to keep the
            filename filesystem-safe.
        result: Parsed JSON response from the API.
        execution_time: Wall-clock seconds the request took.
        base_path: Directory to write into (created if missing).
    """
    safe_model_name = model_name.replace("/", "_")
    os.makedirs(base_path, exist_ok=True)
    output_path = os.path.join(base_path, f'{safe_model_name}.json')
    result_with_time = {
        "result": result,
        "execution_time": execution_time,
    }
    with open(output_path, 'w') as file:
        json.dump(result_with_time, file)
def extract_and_save_xml(model_name, base_path='data/responses', output_base_path='data/xml'):
    """Extract the generated XML text from a saved API response and write it out.

    Reads <base_path>/<safe model name>.json, pulls the text out of
    result["results"][0]["generated_text"], and writes it to
    <output_base_path>/<safe model name>.xml.

    Args:
        model_name: Model identifier; slashes are replaced with underscores
            to match the file naming convention used when saving.
        base_path: Directory holding the saved JSON responses.
        output_base_path: Directory the XML files are written to.

    Returns:
        The extracted XML text on success, None if the input file is missing
        or malformed.  (The original always returned None, which made the
        caller's `if xml_result:` check dead code.)
    """
    safe_model_name = model_name.replace("/", "_")
    input_filename = os.path.join(base_path, f'{safe_model_name}.json')
    output_filename = os.path.join(output_base_path, f'{safe_model_name}.xml')
    try:
        with open(input_filename, 'r') as file:
            content = json.load(file)
        generated_text = content["result"]["results"][0]["generated_text"]
        # Ensure the output directory exists before writing.
        os.makedirs(output_base_path, exist_ok=True)
        with open(output_filename, 'w') as file:
            file.write(generated_text)
        print(f"XML saved to {output_filename}")
        return generated_text
    except FileNotFoundError:
        print(f"File not found: {input_filename}")
    except KeyError:
        print(f"Invalid content format in {input_filename}")
    return None
#######################
# Example usage

# Read the prompt text; the context manager guarantees the handle is closed
# (the original open(...).read() leaked it).
with open('/home/nasredine/dev/work/ai4xml/playground/data/prompts/text_xml_translation.prompt', 'r') as prompt_file:
    input_text = prompt_file.read()

# SECURITY: an API token was previously hard-coded on this line and committed
# to version control — it must be treated as leaked and rotated.  Read it
# from the environment instead (same token used for all models for simplicity).
token = os.environ.get("DEEPINFRA_API_TOKEN", "")

# List of models with their corresponding max_new_tokens values
models = [
    {"name": "mistralai/Mixtral-8x7B-Instruct-v0.1", "max_new_tokens": 30000},
    # {"name": "mistralai/Mistral-7B-Instruct-v0.1", "max_new_tokens": 30000},
    # {"name": "meta-llama/Llama-2-7b-chat-hf", "max_new_tokens": 2000},
    # {"name": "meta-llama/Llama-2-70b-chat-hf", "max_new_tokens": 2000},
    # {"name": "codellama/CodeLlama-34b-Instruct-hf", "max_new_tokens": 10000},
    # {"name": "bigcode/starcoder", "max_new_tokens": 30000},
    # {"name": "Salesforce/codegen-16B-mono", "max_new_tokens": 10000},
]

# Query every model and persist its response plus timing.
for model in models:
    model_name = model["name"]
    max_new_tokens = model["max_new_tokens"]
    result, execution_time = call_api(input_text, token, model_name, max_new_tokens)
    # Save the result and execution time to a file named after the model
    save_result_to_file(model_name, result, execution_time)
    print(f"Results and execution time for {model_name} saved.")

# Extract the XML portion of each saved response.
for model in models:
    model_name = model["name"]
    xml_result = extract_and_save_xml(model_name)
    if xml_result:
        print(f"XML result for {model_name}:")
        print(xml_result)
        # Here you can further process the XML result or save it as needed
    else:
        print(f"No XML result available for {model_name}")
This diff is collapsed.
This diff is collapsed.
%% Cell type:code id: tags:
``` python
!pip install langchain
!pip install python-dotenv
!pip install langchain-fireworks
```
%% Cell type:code id: tags:
``` python
import os
from dotenv import load_dotenv
from langchain.chains import LLMChain
from langchain_core.output_parsers import StrOutputParser
from langchain_fireworks import Fireworks
load_dotenv()
```
%% Output
True
%% Cell type:code id: tags:
``` python
api_key = os.getenv("FIREWORKS_API_KEY")
```
%% Cell type:code id: tags:
``` python
MAX_TOKENS = 4000
```
%% Cell type:code id: tags:
``` python
models = [
'accounts/fireworks/models/starcoder-7b',
'accounts/fireworks/models/starcoder-16b',
'accounts/fireworks/models/llama-v2-13b-code-instruct',
'accounts/fireworks/models/llama-v2-34b-code-instruct',
'accounts/fireworks/models/llama-v2-70b-code-instruct',
]
```
%% Cell type:code id: tags:
``` python
shots = [0, 1]  # Add more shot numbers as needed

# Run every model against every shot's prompt and save each raw completion.
for shot in shots:
    base_path = f'data/prompts/{shot}-shot'
    # Context manager closes the prompt file (open(...).read() leaked the handle).
    with open(f'{base_path}/prompt.txt', 'r') as prompt_file:
        prompt = prompt_file.read()
    for model in models:
        model_name = model.split('/')[-1]
        print(f'Processing model: {model_name}')
        llm = Fireworks(
            fireworks_api_key=api_key,
            model=model,
            max_tokens=MAX_TOKENS)
        result = llm.invoke(prompt)
        # Create the results directory if needed — the duplicate of this
        # loop in a later cell does this explicitly, so stay consistent
        # (writing into a missing directory would raise FileNotFoundError).
        results_dir = f'{base_path}/results'
        os.makedirs(results_dir, exist_ok=True)
        file_path = f'{results_dir}/{model_name}.fireworks.ai.txt'
        with open(file_path, 'w') as file:
            file.write(result)
```
%% Output
Processing model: starcoder-7b
Processing model: starcoder-16b
Processing model: llama-v2-13b-code-instruct
Processing model: llama-v2-34b-code-instruct
Processing model: llama-v2-70b-code-instruct
%% Cell type:markdown id: tags:
### Install necessary packages
Langchain supports many LLM inference providers, including Fireworks.
%% Cell type:code id: tags:
``` python
!pip install langchain
!pip install python-dotenv
```
%% Cell type:code id: tags:
``` python
import os
from dotenv import load_dotenv
import requests
import json
load_dotenv()
```
%% Output
True
%% Cell type:markdown id: tags:
### API KEY
* Register and get an API key from: https://fireworks.ai/api-keys
* Put the key in the `.env` file as the FIREWORKS_API_KEY variable
%% Cell type:code id: tags:
``` python
api_key = os.getenv("FIREWORKS_API_KEY")
```
%% Cell type:code id: tags:
``` python
# Maximum number of tokens the model may generate, keyed by shot count.
max_tokens = {0: 1000, 1: 1000, 2: 2000}
```
%% Cell type:markdown id: tags:
### Prompting Models
%% Cell type:code id: tags:
``` python
models = [
'accounts/fireworks/models/starcoder-7b',
'accounts/fireworks/models/starcoder-16b',
'accounts/fireworks/models/llama-v2-13b-code-instruct',
'accounts/fireworks/models/llama-v2-34b-code-instruct',
'accounts/fireworks/models/llama-v2-70b-code-instruct',
'accounts/fireworks/models/mixtral-8x7b-instruct',
]
```
%% Cell type:code id: tags:
``` python
def send_fireworks_chat_request(model, messages, api_key, max_tokens=4096,
                                temperature=0.6, top_p=1, top_k=40,
                                frequency_penalty=0,
                                presence_penalty=0,
                                ):
    """POST a request to the Fireworks.ai chat-completions endpoint.

    Args:
        model: Fully-qualified Fireworks model id
            (e.g. 'accounts/fireworks/models/mixtral-8x7b-instruct').
        messages: Chat history as a list of {"role": ..., "content": ...} dicts.
        api_key: Fireworks API key, sent as a bearer token.
        max_tokens, temperature, top_p, top_k, frequency_penalty,
        presence_penalty: Sampling parameters forwarded verbatim.

    Returns:
        The parsed JSON response on success.  Non-200 responses are wrapped
        as {"error": <body>} so callers can detect failure — previously the
        raw error body was returned bare and the notebook crashed with
        KeyError: 'choices' (visible in the cell output below).
    """
    url = "https://api.fireworks.ai/inference/v1/chat/completions"
    payload = {
        "model": model,
        "messages": messages,
        "max_tokens": max_tokens,
        "temperature": temperature,
        "top_p": top_p,
        "frequency_penalty": frequency_penalty,
        "presence_penalty": presence_penalty,
        "top_k": top_k,
    }
    headers = {
        "Accept": "application/json",
        "Content-Type": "application/json",
        "Authorization": f"Bearer {api_key}"
    }
    # A timeout keeps the notebook from hanging on a dead connection.
    response = requests.post(url, json=payload, headers=headers, timeout=300)
    if response.status_code != 200:
        # Mirror send_fireworks_request's error contract.
        return {"error": response.json()}
    return response.json()
```
%% Cell type:code id: tags:
``` python
# One-shot chat prompt for plain-text -> AKN4EU XML coverpage conversion:
# a system instruction, one worked example (user -> assistant), and the
# actual request.
# NOTE(review): "formation" in the system prompt is likely a typo for
# "format" — fix in the prompt text itself if re-running experiments.
system_message = """
You are AKN4EU XML formation converter.
You receive plain text documents and convert them to XML.
Return only the final XML document converted from the text.
The user gives some examples of XML documents.
"""
# NOTE(review): this first assistant_message is immediately overwritten by
# the XML version below and is never used — it duplicates user_message_1's
# text and looks like a leftover from an earlier draft.
assistant_message = """
EUROPEAN COMMISSION
Brussels, 21.12.2016
2016/0411 (COD)
Proposal for a
REGULATION OF THE EUROPEAN PARLIAMENT AND OF THE
COUNCIL
amending Regulation (EC)
No 1008/2008 on common rules for the operation of air services in the
Community
EN
"""
# Worked example, part 1: the plain-text coverpage the "user" supplies.
user_message_1 = """
Convert plain text of following coverpage to AKN4EU XML format.
EUROPEAN COMMISSION
Brussels, 21.12.2016
2016/0411 (COD)
Proposal for a
REGULATION OF THE EUROPEAN PARLIAMENT AND OF THE
COUNCIL
amending Regulation (EC)
No 1008/2008 on common rules for the operation of air services in the
Community
EN
"""
# Worked example, part 2: the expected AKN4EU XML answer for user_message_1.
assistant_message = """
<coverPage>
<container name="logo">
<p><img src="EC.png" alt="EUROPEAN COMMISSION"/></p>
</container>
<container name="actingEntity">
<p><organization refersTo="~_COM">EUROPEAN COMMISSION</organization></p>
</container>
<container name="mainDoc">
<block name="placeAndDate">
<location refersTo="~_BEL_BRU">Brussels</location>, <date date="2016-12-21">21.12.2016</date>
</block>
</container>
<container name="procedureIdentifier">
<p><docketNumber refersTo="~_procedure_2016_411">2016/0411 (COD)</docketNumber></p>
</container>
<longTitle>
<p><docStage>Proposal for a</docStage>
<docType refersTo="~_REG">REGULATION OF THE EUROPEAN PARLIAMENT AND OF THE
COUNCIL</docType>
<docPurpose>amending <ref href="http://data.europa.eu/eli/reg/2008/1008">Regulation (EC)
No 1008/2008 on common rules for the operation of air services in the
Community</ref></docPurpose></p>
</longTitle>
<container name="mainDocLanguage">
<p><inline name="language" refersTo="~_FRBRlanguage">EN</inline></p>
</container>
</coverPage>
"""
# The actual conversion request the model should answer.
user_message_2 = """
Convert plain text of following coverpage to AKN4EU XML format.
EUROPEAN COMMISSION
Brussels, 21.12.2017
2012/0412 (COD)
Proposal for a
REGULATION OF THE EUROPEAN PARLIAMENT AND OF THE COUNCIL amending Regulation (EC)
No 1009/2009 on common rules for the operation of air services in the Community
EN
"""
# Assembled chat history passed to the chat-completions API.
messages = [
{"role": "system", "content": system_message},
{"role": "user", "content": user_message_1},
{"role": "assistant", "content": assistant_message},
{"role": "user", "content": user_message_2},
]
```
%% Cell type:code id: tags:
``` python
response
```
%% Output
{'error': {'object': 'error',
'type': 'invalid_request_error',
'message': 'model is missing conversation_config, please use /completions API instead'}}
%% Cell type:code id: tags:
``` python
response = send_fireworks_chat_request("accounts/fireworks/models/starcoder-7b",messages, api_key)
text = response['choices'][0]['text']
print(text)
```
%% Output
---------------------------------------------------------------------------
KeyError Traceback (most recent call last)
Cell In[52], line 2
1 response = send_fireworks_chat_request("accounts/fireworks/models/starcoder-7b",messages, api_key)
----> 2 text = response['choices'][0]['text']
4 print(text)
KeyError: 'choices'
%% Cell type:code id: tags:
``` python
shots = [0, 1, 2]

# Run every model against every shot's prompt, skipping results that
# already exist so the loop is resumable after interruption.
for shot in shots:
    print(f'Processing shot: {shot}')
    base_path = f'data/prompts/{shot}-shot'
    # Context manager closes the prompt file (open(...).read() leaked the handle).
    with open(f'{base_path}/prompt.txt', 'r') as prompt_file:
        prompt = prompt_file.read()
    for model in models:
        model_name = model.split('/')[-1]
        print(f'Processing model: {model_name}')
        results_dir = f'{base_path}/results'
        os.makedirs(results_dir, exist_ok=True)
        file_path = f'{results_dir}/{model_name}.fireworks.ai.txt'
        # Skip models that already have a saved result.
        if os.path.exists(file_path):
            print('Skipping...')
            continue
        llm = Fireworks(
            fireworks_api_key=api_key,
            model=model,
            max_tokens=max_tokens[shot])
        result = llm.invoke(prompt)
        with open(file_path, 'w') as file:
            file.write(result)
```
%% Cell type:markdown id: tags:
### XML Extraction from results
%% Cell type:code id: tags:
``` python
import os
import re  # NOTE(review): unused in this cell — kept in case other cells rely on it

base_dir = 'data/prompts'
shots = [0, 1, 2]

# Pull the <coverPage>...</coverPage> span out of each raw completion and
# save it as .xml alongside the .txt results.
for shot in shots:
    results_path = os.path.join(base_dir, f'{shot}-shot', 'results')
    results_xml_path = os.path.join(base_dir, f'{shot}-shot', 'results-xml')
    # Ensure the results-xml directory exists
    os.makedirs(results_xml_path, exist_ok=True)
    if os.path.isdir(results_path):
        for result_file in os.listdir(results_path):
            file_path = os.path.join(results_path, result_file)
            if not file_path.endswith('.fireworks.ai.txt'):
                continue
            with open(file_path, 'r') as file:
                result_content = file.read()
            start_tag = "<coverPage>"
            end_tag = "</coverPage>"
            # Use the LAST occurrence of each tag: few-shot prompts echo
            # example coverpages, and the model's answer comes last.
            start = result_content.rfind(start_tag)
            end_pos = result_content.rfind(end_tag)
            # BUG FIX: the original computed `end = rfind(...) + len(end_tag)`
            # before checking for -1, so a missing end tag was never detected,
            # and even when a tag was missing it fell through and wrote a
            # bogus slice.  Check first, and skip the file on failure.
            if start == -1 or end_pos == -1:
                print(f"No XML content found in {result_file}")
                continue
            xml_content = result_content[start:end_pos + len(end_tag)]
            # Prepare the filename and path for the extracted XML.
            xml_file_name = result_file.replace('.txt', '.xml')
            xml_file_path = os.path.join(results_xml_path, xml_file_name)
            with open(xml_file_path, 'w') as xml_file:
                xml_file.write(xml_content)
            print(f'Extracted and saved XML for {xml_file_name}')
```
This diff is collapsed.
%% Cell type:markdown id: tags:
### Install necessary packages
Langchain supports many LLM inference providers, including Fireworks.
%% Cell type:code id: tags:
``` python
!pip install langchain
!pip install python-dotenv
```
%% Cell type:code id: tags:
``` python
import os
from dotenv import load_dotenv
import requests
import json
load_dotenv()
```
%% Output
True
%% Cell type:markdown id: tags:
### API KEY
* Register and get an API key from: https://fireworks.ai/api-keys
* Put the key in the `.env` file as the FIREWORKS_API_KEY variable
%% Cell type:code id: tags:
``` python
api_key = os.getenv("FIREWORKS_API_KEY")
```
%% Cell type:code id: tags:
``` python
# Maximum number of tokens the model may generate, keyed by shot count.
max_tokens = {0: 1000, 1: 1000, 2: 2000}
```
%% Cell type:markdown id: tags:
### Prompting Models
%% Cell type:code id: tags:
``` python
models = [
'accounts/fireworks/models/starcoder-7b',
'accounts/fireworks/models/starcoder-16b',
'accounts/fireworks/models/llama-v2-13b-code-instruct',
'accounts/fireworks/models/llama-v2-34b-code-instruct',
'accounts/fireworks/models/llama-v2-70b-code-instruct',
'accounts/fireworks/models/mixtral-8x7b-instruct',
]
```
%% Cell type:code id: tags:
``` python
import requests
import json


def send_fireworks_request(model, api_key, model_type='chat', prompt_or_messages=None, max_tokens=1024,
                           temperature=0.6, top_p=1, top_k=40,
                           frequency_penalty=0, presence_penalty=0):
    """Call the Fireworks.ai inference API.

    For model_type 'chat' the chat-completions endpoint is used and
    prompt_or_messages must be a messages list; for 'completion' the plain
    completions endpoint is used and prompt_or_messages must be a prompt
    string.  Any other model_type raises ValueError.

    Returns the parsed JSON response; non-200 responses are wrapped as
    {"error": <body>} so callers can detect failure.
    """
    # Sampling parameters shared by both endpoints.
    payload = {
        "model": model,
        "max_tokens": max_tokens,
        "temperature": temperature,
        "top_p": top_p,
        "top_k": top_k,
        "presence_penalty": presence_penalty,
        "frequency_penalty": frequency_penalty
    }

    # Pick the endpoint and the payload key the input goes under.
    if model_type == 'chat':
        endpoint = "chat/completions"
        payload["messages"] = prompt_or_messages
    elif model_type == 'completion':
        endpoint = "completions"
        payload["prompt"] = prompt_or_messages
    else:
        raise ValueError("Unsupported model type. Choose 'chat' or 'completion'.")

    resp = requests.post(
        "https://api.fireworks.ai/inference/v1/" + endpoint,
        json=payload,
        headers={
            "Accept": "application/json",
            "Content-Type": "application/json",
            "Authorization": f"Bearer {api_key}"
        },
    )
    if resp.status_code != 200:
        return {"error": resp.json()}
    return resp.json()
```
%% Cell type:code id: tags:
``` python
shots = [0, 1, 2]

# Run every model against every shot's prompt, skipping results that
# already exist so the loop is resumable after interruption.
# NOTE(review): this notebook never imports Fireworks or defines api_key in
# the visible cells — confirm the langchain_fireworks import cell exists.
for shot in shots:
    print(f'Processing shot: {shot}')
    base_path = f'data/prompts/{shot}-shot'
    # Context manager closes the prompt file (open(...).read() leaked the handle).
    with open(f'{base_path}/prompt.txt', 'r') as prompt_file:
        prompt = prompt_file.read()
    for model in models:
        model_name = model.split('/')[-1]
        print(f'Processing model: {model_name}')
        results_dir = f'{base_path}/results'
        os.makedirs(results_dir, exist_ok=True)
        file_path = f'{results_dir}/{model_name}.fireworks.ai.txt'
        # Skip models that already have a saved result.
        if os.path.exists(file_path):
            print('Skipping...')
            continue
        llm = Fireworks(
            fireworks_api_key=api_key,
            model=model,
            max_tokens=max_tokens[shot])
        result = llm.invoke(prompt)
        with open(file_path, 'w') as file:
            file.write(result)
```
%% Cell type:markdown id: tags:
### XML Extraction from results
%% Cell type:code id: tags:
``` python
import os
import re  # NOTE(review): unused in this cell — kept in case other cells rely on it

base_dir = 'data/prompts'
shots = [0, 1, 2]

# Pull the <coverPage>...</coverPage> span out of each raw completion and
# save it as .xml alongside the .txt results.
for shot in shots:
    results_path = os.path.join(base_dir, f'{shot}-shot', 'results')
    results_xml_path = os.path.join(base_dir, f'{shot}-shot', 'results-xml')
    # Ensure the results-xml directory exists
    os.makedirs(results_xml_path, exist_ok=True)
    if os.path.isdir(results_path):
        for result_file in os.listdir(results_path):
            file_path = os.path.join(results_path, result_file)
            if not file_path.endswith('.fireworks.ai.txt'):
                continue
            with open(file_path, 'r') as file:
                result_content = file.read()
            start_tag = "<coverPage>"
            end_tag = "</coverPage>"
            # Use the LAST occurrence of each tag: few-shot prompts echo
            # example coverpages, and the model's answer comes last.
            start = result_content.rfind(start_tag)
            end_pos = result_content.rfind(end_tag)
            # BUG FIX: the original computed `end = rfind(...) + len(end_tag)`
            # before checking for -1, so a missing end tag was never detected,
            # and even when a tag was missing it fell through and wrote a
            # bogus slice.  Check first, and skip the file on failure.
            if start == -1 or end_pos == -1:
                print(f"No XML content found in {result_file}")
                continue
            xml_content = result_content[start:end_pos + len(end_tag)]
            # Prepare the filename and path for the extracted XML.
            xml_file_name = result_file.replace('.txt', '.xml')
            xml_file_path = os.path.join(results_xml_path, xml_file_name)
            with open(xml_file_path, 'w') as xml_file:
                xml_file.write(xml_content)
            print(f'Extracted and saved XML for {xml_file_name}')
```
%% Cell type:code id: tags:
``` python
import xml.etree.ElementTree as ET
import os
```
%% Cell type:code id: tags:
``` python
def validate_xml(xml_file):
    """Check that xml_file parses as well-formed XML.

    Args:
        xml_file: Path to the XML file to validate.

    Returns:
        (True, "") when the file parses cleanly, otherwise
        (False, "XML is not well-formed: <parser details>").
    """
    try:
        # The parse result is discarded — only well-formedness matters
        # (the original bound it to an unused `tree` local).
        ET.parse(xml_file)
        return True, ""
    except ET.ParseError as e:
        return False, f"XML is not well-formed: {e}"
```
%% Cell type:code id: tags:
``` python
# Report the well-formedness of every extracted XML file, per shot count.
for shot in [0, 1, 2]:
    print(f'Evaluating {shot}-shot')
    print('=' * 20)
    result_xml_dir = f'data/prompts/{shot}-shot/results-xml/'
    for xml_file in os.listdir(result_xml_dir):
        if not xml_file.endswith('.xml'):
            continue
        is_valid, message = validate_xml(f'{result_xml_dir}/{xml_file}')
        print(f'{xml_file} is {is_valid}: {message}')
```
%% Output
Evaluating 0-shot
====================
zephyr-7b-alpha.gpt.grc.xml is True:
zephyr-7b-beta.gpt.grc.xml is True:
gpt-35-turbo-0301.gpt.grc.xml is True:
mistral-7b-openorca.xml is True:
gpt-4-32k.gpt.grc.xml is True:
llama-2-70b-chat.xml is False: XML is not well-formed: mismatched tag: line 12, column 8
gpt-35-turbo-16k.grc.xml is True:
gpt-4.grc.xml is True:
llama-2-13b-chat.xml is True:
Evaluating 1-shot
====================
starcoder-16b.fireworks.ai.xml is False: XML is not well-formed: syntax error: line 2, column 0
llama-v2-34b-code-instruct.fireworks.ai.xml is True:
llama-v2-13b-code-instruct.xml is True:
starcoder-7b.fireworks.ai.xml is False: XML is not well-formed: syntax error: line 2, column 0
mixtral-8x7b-instruct_fireworks.ai.xml is True:
llama-2-70b-chat.gpt.jrc.xml is True:
zephyr-7b-beta.gpt.jrc.xml is True:
nous-hermes-2-mixtral-8x7b-dpo-gpt.jrc.xml is True:
mistral-7b-openorca.gpt.jrc.xml is True:
zephyr-7b-alpha.gpt.jrc.xml is True:
Evaluating 2-shot
====================
starcoder-16b.fireworks.ai.xml is False: XML is not well-formed: not well-formed (invalid token): line 2, column 1
llama-v2-34b-code-instruct.fireworks.ai.xml is True:
llama-v2-13b-code-instruct.fireworks.ai.xml is True:
starcoder-7b.fireworks.ai.xml is False: XML is not well-formed: not well-formed (invalid token): line 60, column 51
mixtral-8x7b-instruct.fireworks.ai.xml is False: XML is not well-formed: mismatched tag: line 50, column 26
zephyr-7b-beta.gpt.jrc.xml is False: XML is not well-formed: junk after document element: line 39, column 0
nous-hermes-2-mixtral-8x7b-dpo-gpt.jrc.xml is True:
mistral-7b-openorca.gpt.jrc.xml is True:
zephyr-7b-alpha.gpt.jrc.xml is True:
%% Cell type:code id: tags:
``` python
```
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment