Introduction
Zephyr is a series of language models designed to serve as helpful assistants. Zephyr-7B-α, the first model in the series, is a fine-tuned version of mistralai/Mistral-7B-v0.1. It was trained on a combination of publicly available and synthetic datasets using Direct Preference Optimization (DPO), and it outperforms Llama 2 70B Chat on MT-Bench.
Zephyr-7B-α
Zephyr-7B-α is the first model in the Zephyr series and is based on mistralai/Mistral-7B-v0.1. It has been fine-tuned using Direct Preference Optimization (DPO) on a mix of publicly available and synthetic datasets. Notably, the in-built alignment of these datasets was removed to boost performance on MT-Bench and make the model more helpful.
Run Zephyr 7B with an API
You can run the Zephyr 7B model API using Clarifai’s Python SDK.
Export your PAT as an environment variable
export CLARIFAI_PAT={your personal access token}
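If exporting a shell variable is inconvenient, you can also set the PAT from Python before creating the client. This is a minimal sketch; the token value below is a placeholder, not a real credential:

import os

# Placeholder only: substitute your actual personal access token.
# The Clarifai SDK reads CLARIFAI_PAT from the environment.
os.environ["CLARIFAI_PAT"] = "your personal access token"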
Check out the code below to run the model:
import os
from clarifai.client.model import Model

# The Clarifai SDK reads your PAT from the CLARIFAI_PAT environment variable
assert "CLARIFAI_PAT" in os.environ, "Set CLARIFAI_PAT before running"

system_message = "You are a friendly chatbot who always responds in the style of a pirate."
prompt = "Write a tweet on future of AI"

# Build the prompt in Zephyr's <|system|>/<|user|>/<|assistant|> chat format
prompt_template = (
    f"<|system|>\n{system_message}</s>\n"
    f"<|user|>\n{prompt}</s>\n"
    f"<|assistant|>\n"
)

# Model Predict
model_prediction = Model(
    "https://clarifai.com/huggingface-research/zephyr/models/zephyr-7B-alpha"
).predict_by_bytes(prompt_template.encode(), "text")

print(model_prediction.outputs[0].data.text.raw)
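You can optionally pass sampling controls through the SDK's inference_params argument. The parameter names used below (temperature, max_tokens) are an assumption based on common Clarifai text-model settings and may differ for a given model version:

# Sampling controls go in a plain dict; supported keys may vary by
# model version (the names and values here are illustrative assumptions).
model_prediction = Model(
    "https://clarifai.com/huggingface-research/zephyr/models/zephyr-7B-alpha"
).predict_by_bytes(
    prompt_template.encode(),
    "text",
    inference_params={"temperature": 0.7, "max_tokens": 256},
)
print(model_prediction.outputs[0].data.text.raw)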
You can also run the Zephyr 7B API using other Clarifai client libraries, such as Java, cURL, NodeJS, and PHP, here.
Use Cases
Zephyr-7B-α was initially fine-tuned on a variant of the UltraChat dataset, which contains synthetic dialogues generated by ChatGPT. It was then further aligned with Hugging Face TRL’s DPOTrainer on the openbmb/UltraFeedback dataset, which consists of prompts and model completions ranked by GPT-4. This makes the model well suited to chat applications.
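For a sense of what this alignment step looks like in code, below is a minimal sketch of DPO training with TRL's DPOTrainer. It assumes the preference data has already been preprocessed into prompt/chosen/rejected columns (the raw openbmb/UltraFeedback release needs binarizing into that format first), and the hyperparameters, batch size, and output directory are illustrative assumptions rather than Zephyr's actual recipe; the exact DPOTrainer signature also varies across TRL versions:

from datasets import load_dataset
from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments
from trl import DPOTrainer

# Start from the same base model Zephyr was built on
model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-v0.1")
tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-v0.1")

# Preference data: each row needs "prompt", "chosen", and "rejected" text
train_dataset = load_dataset("openbmb/UltraFeedback", split="train")

trainer = DPOTrainer(
    model,
    ref_model=None,    # TRL keeps a frozen copy of the policy as the reference
    beta=0.1,          # strength of the KL penalty (assumed value)
    train_dataset=train_dataset,
    tokenizer=tokenizer,
    args=TrainingArguments(output_dir="zephyr-dpo", per_device_train_batch_size=2),
)
trainer.train()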
Limitations
Zephyr-7B-α has not been aligned to human preferences using techniques like Reinforcement Learning from Human Feedback (RLHF), nor has it undergone in-the-loop filtering of responses like ChatGPT. As a result, it can produce problematic outputs, especially when intentionally prompted to do so. The size and composition of the corpus used to train the base model (mistralai/Mistral-7B-v0.1) are also unknown, but it likely included a mix of web data and technical sources such as books and code. See the Falcon 180B model card for an example of this.
ID: zephyr-7B-alpha
Model Type ID: Text To Text
Input Type: text
Output Type: text
Description: Zephyr is a 7-billion-parameter LLM fine-tuned from Mistral-7B that outperforms Llama 2 70B Chat on MT-Bench.