Upload folder using huggingface_hub
Browse files- config.json +33 -0
- mergekit_moe_config.yml +139 -0
- model-00001-of-00003.safetensors +3 -0
- model-00002-of-00003.safetensors +3 -0
- model-00003-of-00003.safetensors +3 -0
- model.safetensors.index.json +1 -0
- special_tokens_map.json +24 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +42 -0
config.json
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "HuggingFaceTB/cosmo-1b",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 2048,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 8192,
|
14 |
+
"max_position_embeddings": 2048,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 16,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 24,
|
19 |
+
"num_key_value_heads": 16,
|
20 |
+
"num_local_experts": 8,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pretraining_tp": 1,
|
23 |
+
"rms_norm_eps": 1e-05,
|
24 |
+
"rope_scaling": null,
|
25 |
+
"rope_theta": 10000.0,
|
26 |
+
"router_aux_loss_coef": 0.001,
|
27 |
+
"sliding_window": null,
|
28 |
+
"tie_word_embeddings": false,
|
29 |
+
"torch_dtype": "bfloat16",
|
30 |
+
"transformers_version": "4.38.1",
|
31 |
+
"use_cache": true,
|
32 |
+
"vocab_size": 32000
|
33 |
+
}
|
mergekit_moe_config.yml
ADDED
@@ -0,0 +1,139 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: HuggingFaceTB/cosmo-1b
|
2 |
+
gate_mode: hidden # one of "hidden", "cheap_embed", or "random"
|
3 |
+
dtype: bfloat16 # output dtype (float32, float16, or bfloat16)
|
4 |
+
experts_per_token: 2
|
5 |
+
experts:
|
6 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
7 |
+
positive_prompts:
|
8 |
+
- "List three synonyms for the word 'happy'."
|
9 |
+
- "Imagine you are developing an innovative project or initiative that combines the thrilling worlds of sports, such as Cricket, Basketball, Football, Soccer, Baseball, Ice Hockey, and Video Games. Consider how strategy, performance, and unexpected journeys intersect within these domains. How might you create a platform or experience that transcends traditional boundaries, allowing athletes and fans to explore new dimensions of competition, collaboration, and storytelling? Delve into the potential applications, impacts, and novel questions that arise from this intersection, pushing the limits of creativity and innovation to uncover exciting, original possibilities."
|
10 |
+
- "Imagine a project that combines the thrilling world of professional wrestling with the engaging narrative design of video games, set in the performing arts realm. How might you create dynamic characters, inspired by real-life wrestlers, that embody the athleticism and entertainment aspects of wrestling, while also weaving in thoughtful career development and music-based storytelling? Consider how technology could enhance this experience, enabling in-depth analysis of matches and character development through data-driven insights. Ultimately, this initiative could generate novel questions about the intersection of sports, entertainment, and technology, while providing fans with an immersive and innovative way to engage with their favorite wrestlers and stories."
|
11 |
+
- "Imagine a community center that brings together the worlds of paper mache, film history, and anime fandom, while also promoting fitness and personal growth. How might this unique space look, feel, and function? What kind of programs, activities, or events could it host to engage and inspire its members? Consider the potential impacts on communication, collaboration, and creativity. Now, imagine this center has a bakery that not only serves delicious treats but also serves as a platform for storytelling and adventure. How might these themes intertwine and enrich each other? What novel questions, opportunities, or challenges arise from their intersection? Please describe your innovative project or initiative that integrates these themes."
|
12 |
+
- "Imagine you are a conceptual artist embarking on a groundbreaking exhibition that explores the intersection of the cosmos and creativity. How might you use a telescope as a tool for photography, capturing images of stars and constellations to create visual art pieces? Consider how different weather conditions and geographic locations could influence your artwork, and how the process of exploration, both physical and intellectual, might inspire your project. Delve into the novel questions, potential applications, and impacts that arise from this intersection of themes, pushing the boundaries of traditional art and scientific inquiry."
|
13 |
+
negative_prompts:
|
14 |
+
- "Imagine you are tasked with creating a unique, innovative project that combines the themes of pharmaceutical manufacturing, geometric design, and personalization. How might you incorporate artistry into the production process, and what role could ceramic mugs play in this initiative? Additionally, consider how this project could intersect with American football culture and product marketing. How might the project be applied to weddings, and what novel questions or impacts could arise from this intersection? Explore potential concepts, applications, and implications for this integrated project."
|
15 |
+
- "Imagine a world where cryptocurrency trading is enhanced by advanced mathematical models and technologies. Consider the possibilities of integrating matrices, regression analysis, and probability distributions to optimize trading strategies and blockchain transactions. How might the principles of refraction and rings inspire new approaches to data visualization and security in this context? Could such a system help address challenges of transparency, volatility, and risk management in cryptocurrency markets? Explore how these themes can intersect to create an innovative, impactful project or initiative that transforms the future of cryptocurrency and data analysis."
|
16 |
+
- "Imagine a groundbreaking project or initiative that addresses the intersection of state violence, international relations, and collective bargaining. How could this project also promote accessibility, education, and disability rights at the local level? Consider the role of philanthropy and community engagement in ensuring the project's success and sustainability. What novel questions or challenges might arise from this intersection of themes, and how might they be addressed?"
|
17 |
+
- "Imagine weaving together the realms of spirituality, Christian theology, and prayer with hair care, skin care, and beauty products, all while incorporating elements of alternative medicine. How might these themes intersect to create a unique project or initiative that promotes holistic well-being, inner peace, and outer beauty? Consider the potential applications, impacts, and novel questions that arise from this fusion, and brainstorm innovative concepts that challenge traditional boundaries and encourage mindful self-care practices."
|
18 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
19 |
+
positive_prompts:
|
20 |
+
- "Combine these two sentences into a complex sentence using the word 'because': The girl was tired. She went to sleep early."
|
21 |
+
- "Imagine a world where astrology, timekeeping, and technology intersect to create a revolutionary online dating platform. This platform uses jewelry, metals, and lighting design to visually represent individual astrological charts, while also serving as functional timekeeping devices. How might wearable, interactive, and customizable pieces of jewelry, such as smartwatches or brooches, display a person's astrological profile and facilitate connections with compatible partners based on shared interests, values, or cosmic energies? As users engage with the platform, they can study their own astrological charts and those of potential partners, deepening their understanding of astrology while also exploring the intricacies of watchmaking and horology. Furthermore, how might this integration of themes impact the fashion industry by encouraging the creation of statement pieces that serve both functional and symbolic purposes? Through this project, we could examine the potential applications, impacts, and novel questions that arise from the intersection of these diverse fields."
|
22 |
+
- "Imagine you are tasked with creating a unique, innovative project that combines the themes of pharmaceutical manufacturing, geometric design, and personalization. How might you incorporate artistry into the production process, and what role could ceramic mugs play in this initiative? Additionally, consider how this project could intersect with American football culture and product marketing. How might the project be applied to weddings, and what novel questions or impacts could arise from this intersection? Explore potential concepts, applications, and implications for this integrated project."
|
23 |
+
- "Imagine a groundbreaking initiative that interweaves the themes of water, cleaning, maintenance, home improvement, repair, business jets, automotive parts, and suspension systems. Envision a project that revolutionizes how we manage and utilize water resources while incorporating advanced cleaning technologies and innovative maintenance solutions for both residential settings and business aviation. How might this project integrate cutting-edge suspension systems in both automotive parts and business jets, creating synergies between land and air transportation? Consider the potential applications, environmental impacts, and novel questions arising from this intersection, inviting a paradigm shift in sustainability, mobility, and systemic design."
|
24 |
+
- "Imagine a world where batteries in electric vehicles (EVs) are repurposed as sustainable energy storage solutions for waste management facilities, while also providing habitats for pollinator insects like bees. How might entomology and apiculture contribute to this closed-loop system, and what novel questions or challenges arise from this intersection of technology, waste management, environment, and sustainability? Explore the potential applications and impacts of such an innovative project, and consider how the integration of these diverse fields could lead to innovative solutions for a more sustainable future."
|
25 |
+
- "Imagine a project that combines the artisanal practices of coffee roasting, wine making, and craft distilleries with innovative techniques and culinary arts. How might the flavors and aromas of these beverages intersect with the world of baking, Cantonese cuisine, and mayonnaise creation? Consider the equipment and traditions behind fishing, and how they might influence travel and the sharing of culinary knowledge. How can we use these intersections to explore new impacts on local economies, sustainability, and the future of food and drink? Generate ideas for an innovative project that brings these themes together in a unique and engaging way."
|
26 |
+
negative_prompts:
|
27 |
+
- "Imagine you are developing an innovative project or initiative that combines the thrilling worlds of sports, such as Cricket, Basketball, Football, Soccer, Baseball, Ice Hockey, and Video Games. Consider how strategy, performance, and unexpected journeys intersect within these domains. How might you create a platform or experience that transcends traditional boundaries, allowing athletes and fans to explore new dimensions of competition, collaboration, and storytelling? Delve into the potential applications, impacts, and novel questions that arise from this intersection, pushing the limits of creativity and innovation to uncover exciting, original possibilities."
|
28 |
+
- "In the era of the Digital Age, how can we leverage the nostalgia of vintage gaming, the convenience of wireless speakers and smartphones, and the advanced capabilities of modern audio systems to create an innovative consumer electronics initiative that prioritizes data privacy and protection, while also raising awareness and sparking curiosity about the intersection of technology and privacy in our increasingly connected world? Consider potential applications, impacts on user experience and societal norms, and novel questions that arise from the integration of these themes."
|
29 |
+
- "Imagine a world where the healing powers of cannabis and the unconditional love of dogs come together to improve veterinary medicine, training, and oral health. How might we innovatively integrate these themes to create a novel project or initiative? Consider potential applications such as developing cannabis-based dental care products for dogs, using CBD oil to aid in training and behavior management, or establishing veterinary clinics that specialize in holistic care for dogs, including dental hygiene and alternative therapies. What impacts could this have on the well-being of our canine companions, the veterinary field, and the innovation of oral health solutions? How might this intersection challenge and expand our understanding of these themes and their practical applications? Explore and generate ideas that push the boundaries of what is currently possible, and consider the novel questions that arise from their intersection."
|
30 |
+
- "Imagine a city of the future where public safety, urban development, and transportation intersect to create a seamless, integrated, and sustainable urban experience. How might public transit, shipping, and vehicle operations be reimagined to enhance public safety while promoting efficient transportation and business operations? Consider the role of insurance in mitigating risks associated with these innovations and the legal profession in navigating the complex web of regulations and policies that will emerge. How can we leverage advances in technology, data analysis, and urban planning to create an environment that is safe, accessible, and equitable for all members of our society? Generate novel ideas or concepts that integrate these themes and explore their potential applications, impacts, and the legal and ethical questions that arise from their intersection."
|
31 |
+
- "Imagine a groundbreaking initiative that combines the art of dance, the practice of yoga, and a deep understanding of child development to create innovative therapeutic interventions for children facing health challenges. How might this intersection inspire novel questions in the realms of immunology, cancer research, and therapeutic drugs? Furthermore, consider how nutrition, general health, supplements, and diet could be integrated to optimize these interventions and enhance their impact. Envision the potential applications and benefits of such a holistic approach, and brainstorm ways to measure its success and evaluate its effectiveness."
|
32 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
33 |
+
positive_prompts:
|
34 |
+
- "Read the following passage about planets.
|
35 |
+
|
36 |
+
'The Planets of Our Solar System
|
37 |
+
|
38 |
+
Our solar system is a fascinating place! It has a big, bright star called the Sun. The Sun is the center, and eight planets travel around it. These planets are very different from each other.
|
39 |
+
|
40 |
+
Mercury is the smallest planet and closest to the Sun. Venus is the hottest planet. Earth is our home. It's the only planet we know of that has life. Mars is a red, dusty planet with two small moons named Phobos and Deimos. Jupiter is the biggest planet. It's a giant ball of gas with a huge storm called the Great Red Spot. Saturn has beautiful rings made of ice and rock. Uranus and Neptune are cold, blue planets far from the Sun.'
|
41 |
+
|
42 |
+
How many moons does Mars have?"
|
43 |
+
- "Imagine a world where cryptocurrency trading is enhanced by advanced mathematical models and technologies. Consider the possibilities of integrating matrices, regression analysis, and probability distributions to optimize trading strategies and blockchain transactions. How might the principles of refraction and rings inspire new approaches to data visualization and security in this context? Could such a system help address challenges of transparency, volatility, and risk management in cryptocurrency markets? Explore how these themes can intersect to create an innovative, impactful project or initiative that transforms the future of cryptocurrency and data analysis."
|
44 |
+
- "In the era of the Digital Age, how can we leverage the nostalgia of vintage gaming, the convenience of wireless speakers and smartphones, and the advanced capabilities of modern audio systems to create an innovative consumer electronics initiative that prioritizes data privacy and protection, while also raising awareness and sparking curiosity about the intersection of technology and privacy in our increasingly connected world? Consider potential applications, impacts on user experience and societal norms, and novel questions that arise from the integration of these themes."
|
45 |
+
- "Imagine you are part of a cross-functional team tasked with creating an innovative digital solution that revolutionizes the way businesses operate and communicate in the modern digital landscape. Your task is to develop a concept that integrates themes of email communication, cybersecurity, digital systems, online communication, platform evolution, digital marketing, SEO, business strategies, project management, agile methodologies, interactive marketing, and more. How might you leverage the power of these interconnected themes to build a secure, efficient, and user-friendly digital platform that enhances business communication, collaboration, and growth? Consider potential applications, impacts, and novel questions that arise from this intersection, as well as the ways in which this project could transform the way we approach digital systems and online interactions in the business world and beyond."
|
46 |
+
- "Imagine a comprehensive financial management platform that seamlessly integrates themes of marketing, business, and data with retirement planning, taxation, and financial record-keeping. This platform could also provide real-time insights into the stock market, institutional investing, and personal finance, while offering home loans, credit cards, and title loans with competitive interest rates. Additionally, it could serve as a brokerage for real estate and other investments, utilizing AI-driven algorithms to optimize portfolios and maximize returns. How might such a platform revolutionize the way individuals and businesses manage their finances, and what new opportunities, challenges, and questions would arise from the intersection of these themes?"
|
47 |
+
negative_prompts:
|
48 |
+
- "Imagine a community center that brings together the worlds of paper mache, film history, and anime fandom, while also promoting fitness and personal growth. How might this unique space look, feel, and function? What kind of programs, activities, or events could it host to engage and inspire its members? Consider the potential impacts on communication, collaboration, and creativity. Now, imagine this center has a bakery that not only serves delicious treats but also serves as a platform for storytelling and adventure. How might these themes intertwine and enrich each other? What novel questions, opportunities, or challenges arise from their intersection? Please describe your innovative project or initiative that integrates these themes."
|
49 |
+
- "Imagine a world where spirituality, mental health, and personal growth are seamlessly intertwined to create holistic well-being. How might we design an innovative project or initiative that addresses information overload, trauma, addiction, and counseling through the lenses of these themes? Explore potential applications, impacts, and novel questions that arise from the intersection of these areas, envisioning a future where individuals can heal, grow, and thrive in a supportive and integrated environment."
|
50 |
+
- "Imagining Interdisciplinary Solutions: How might we integrate the themes of medical malpractice, product liability, and personal injury with firefighting, safety protocols, and emergency response to create innovative approaches that enhance patient safety, product accountability, and community protection? Explore potential applications, impacts, or novel questions that arise from the intersection of these fields, and consider how integrated systems could improve patient outcomes, promote safer products, and strengthen emergency response capabilities."
|
51 |
+
- "Imagine a world where astrology, timekeeping, and technology intersect to create a revolutionary online dating platform. This platform uses jewelry, metals, and lighting design to visually represent individual astrological charts, while also serving as functional timekeeping devices. How might wearable, interactive, and customizable pieces of jewelry, such as smartwatches or brooches, display a person's astrological profile and facilitate connections with compatible partners based on shared interests, values, or cosmic energies? As users engage with the platform, they can study their own astrological charts and those of potential partners, deepening their understanding of astrology while also exploring the intricacies of watchmaking and horology. Furthermore, how might this integration of themes impact the fashion industry by encouraging the creation of statement pieces that serve both functional and symbolic purposes? Through this project, we could examine the potential applications, impacts, and novel questions that arise from the intersection of these diverse fields."
|
52 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
53 |
+
positive_prompts:
|
54 |
+
- "What are the next two numbers in the sequence: 1, 4, 9, 16..."
|
55 |
+
- "Imagine a world where the healing powers of cannabis and the unconditional love of dogs come together to improve veterinary medicine, training, and oral health. How might we innovatively integrate these themes to create a novel project or initiative? Consider potential applications such as developing cannabis-based dental care products for dogs, using CBD oil to aid in training and behavior management, or establishing veterinary clinics that specialize in holistic care for dogs, including dental hygiene and alternative therapies. What impacts could this have on the well-being of our canine companions, the veterinary field, and the innovation of oral health solutions? How might this intersection challenge and expand our understanding of these themes and their practical applications? Explore and generate ideas that push the boundaries of what is currently possible, and consider the novel questions that arise from their intersection."
|
56 |
+
- "Imagine weaving together the realms of spirituality, Christian theology, and prayer with hair care, skin care, and beauty products, all while incorporating elements of alternative medicine. How might these themes intersect to create a unique project or initiative that promotes holistic well-being, inner peace, and outer beauty? Consider the potential applications, impacts, and novel questions that arise from this fusion, and brainstorm innovative concepts that challenge traditional boundaries and encourage mindful self-care practices."
|
57 |
+
- "Imagine a groundbreaking initiative that combines the art of dance, the practice of yoga, and a deep understanding of child development to create innovative therapeutic interventions for children facing health challenges. How might this intersection inspire novel questions in the realms of immunology, cancer research, and therapeutic drugs? Furthermore, consider how nutrition, general health, supplements, and diet could be integrated to optimize these interventions and enhance their impact. Envision the potential applications and benefits of such a holistic approach, and brainstorm ways to measure its success and evaluate its effectiveness."
|
58 |
+
- "Imagine a world where spirituality, mental health, and personal growth are seamlessly intertwined to create holistic well-being. How might we design an innovative project or initiative that addresses information overload, trauma, addiction, and counseling through the lenses of these themes? Explore potential applications, impacts, and novel questions that arise from the intersection of these areas, envisioning a future where individuals can heal, grow, and thrive in a supportive and integrated environment."
|
59 |
+
- "Imagine you are designing an innovative project or initiative that intersects the themes of Navigating Medical School, Healthcare Innovation, Geriatric Care, Public Health, Education, and Crisis Communication. How can you create synergy between these areas to address current and future challenges in healthcare? Consider potential applications, impacts, and novel questions that arise from their intersection. For instance, how might reimagining medical education to focus on geriatric care and public health crisis management spur healthcare innovation and improve communication strategies during crises? Explore the possibilities and implications of this integrated approach."
|
60 |
+
negative_prompts:
|
61 |
+
- "Imagine a project that integrates the themes of energy policy, research, writing, analysis, and sustainability. How might these areas intersect to create innovative solutions for a more sustainable future? Consider the potential applications of new energy policies that prioritize renewable resources and reduce dependence on fossil fuels. What novel questions arise when examining the intersection of energy policy and sustainability through a research and analysis lens? How might your writing contribute to the ongoing discourse surrounding these critical issues? Please develop a concept that addresses these themes and offers a unique perspective or approach to tackling the challenges at the nexus of energy, policy, and sustainability."
|
62 |
+
- "Imagine you are part of a cross-functional team tasked with creating an innovative digital solution that revolutionizes the way businesses operate and communicate in the modern digital landscape. Your task is to develop a concept that integrates themes of email communication, cybersecurity, digital systems, online communication, platform evolution, digital marketing, SEO, business strategies, project management, agile methodologies, interactive marketing, and more. How might you leverage the power of these interconnected themes to build a secure, efficient, and user-friendly digital platform that enhances business communication, collaboration, and growth? Consider potential applications, impacts, and novel questions that arise from this intersection, as well as the ways in which this project could transform the way we approach digital systems and online interactions in the business world and beyond."
|
63 |
+
- "Imagine you are a conceptual artist embarking on a groundbreaking exhibition that explores the intersection of the cosmos and creativity. How might you use a telescope as a tool for photography, capturing images of stars and constellations to create visual art pieces? Consider how different weather conditions and geographic locations could influence your artwork, and how the process of exploration, both physical and intellectual, might inspire your project. Delve into the novel questions, potential applications, and impacts that arise from this intersection of themes, pushing the boundaries of traditional art and scientific inquiry."
|
64 |
+
- "Imagine a groundbreaking initiative that interweaves the themes of water, cleaning, maintenance, home improvement, repair, business jets, automotive parts, and suspension systems. Envision a project that revolutionizes how we manage and utilize water resources while incorporating advanced cleaning technologies and innovative maintenance solutions for both residential settings and business aviation. How might this project integrate cutting-edge suspension systems in both automotive parts and business jets, creating synergies between land and air transportation? Consider the potential applications, environmental impacts, and novel questions arising from this intersection, inviting a paradigm shift in sustainability, mobility, and systemic design."
|
65 |
+
- "Imagine a project that combines the artisanal practices of coffee roasting, wine making, and craft distilleries with innovative techniques and culinary arts. How might the flavors and aromas of these beverages intersect with the world of baking, Cantonese cuisine, and mayonnaise creation? Consider the equipment and traditions behind fishing, and how they might influence travel and the sharing of culinary knowledge. How can we use these intersections to explore new impacts on local economies, sustainability, and the future of food and drink? Generate ideas for an innovative project that brings these themes together in a unique and engaging way."
|
66 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
67 |
+
positive_prompts:
|
68 |
+
- "Provide two antonyms for the word 'cold'."
|
69 |
+
- "Imagine a groundbreaking project or initiative that addresses the intersection of state violence, international relations, and collective bargaining. How could this project also promote accessibility, education, and disability rights at the local level? Consider the role of philanthropy and community engagement in ensuring the project's success and sustainability. What novel questions or challenges might arise from this intersection of themes, and how might they be addressed?"
|
70 |
+
- "Imagine a city of the future where public safety, urban development, and transportation intersect to create a seamless, integrated, and sustainable urban experience. How might public transit, shipping, and vehicle operations be reimagined to enhance public safety while promoting efficient transportation and business operations? Consider the role of insurance in mitigating risks associated with these innovations and the legal profession in navigating the complex web of regulations and policies that will emerge. How can we leverage advances in technology, data analysis, and urban planning to create an environment that is safe, accessible, and equitable for all members of our society? Generate novel ideas or concepts that integrate these themes and explore their potential applications, impacts, and the legal and ethical questions that arise from their intersection."
|
71 |
+
- "Imagining Interdisciplinary Solutions: How might we integrate the themes of medical malpractice, product liability, and personal injury with firefighting, safety protocols, and emergency response to create innovative approaches that enhance patient safety, product accountability, and community protection? Explore potential applications, impacts, or novel questions that arise from the intersection of these fields, and consider how integrated systems could improve patient outcomes, promote safer products, and strengthen emergency response capabilities."
|
72 |
+
- "Imagine a project that integrates the themes of energy policy, research, writing, analysis, and sustainability. How might these areas intersect to create innovative solutions for a more sustainable future? Consider the potential applications of new energy policies that prioritize renewable resources and reduce dependence on fossil fuels. What novel questions arise when examining the intersection of energy policy and sustainability through a research and analysis lens? How might your writing contribute to the ongoing discourse surrounding these critical issues? Please develop a concept that addresses these themes and offers a unique perspective or approach to tackling the challenges at the nexus of energy, policy, and sustainability."
|
73 |
+
negative_prompts:
|
74 |
+
- "Imagine a groundbreaking initiative that combines the art of dance, the practice of yoga, and a deep understanding of child development to create innovative therapeutic interventions for children facing health challenges. How might this intersection inspire novel questions in the realms of immunology, cancer research, and therapeutic drugs? Furthermore, consider how nutrition, general health, supplements, and diet could be integrated to optimize these interventions and enhance their impact. Envision the potential applications and benefits of such a holistic approach, and brainstorm ways to measure its success and evaluate its effectiveness."
|
75 |
+
- "Imagine a project that combines the artisanal practices of coffee roasting, wine making, and craft distilleries with innovative techniques and culinary arts. How might the flavors and aromas of these beverages intersect with the world of baking, Cantonese cuisine, and mayonnaise creation? Consider the equipment and traditions behind fishing, and how they might influence travel and the sharing of culinary knowledge. How can we use these intersections to explore new impacts on local economies, sustainability, and the future of food and drink? Generate ideas for an innovative project that brings these themes together in a unique and engaging way."
|
76 |
+
- "Imagine a project that combines the thrilling world of professional wrestling with the engaging narrative design of video games, set in the performing arts realm. How might you create dynamic characters, inspired by real-life wrestlers, that embody the athleticism and entertainment aspects of wrestling, while also weaving in thoughtful career development and music-based storytelling? Consider how technology could enhance this experience, enabling in-depth analysis of matches and character development through data-driven insights. Ultimately, this initiative could generate novel questions about the intersection of sports, entertainment, and technology, while providing fans with an immersive and innovative way to engage with their favorite wrestlers and stories."
|
77 |
+
- "Imagine you are tasked with creating a unique, innovative project that combines the themes of pharmaceutical manufacturing, geometric design, and personalization. How might you incorporate artistry into the production process, and what role could ceramic mugs play in this initiative? Additionally, consider how this project could intersect with American football culture and product marketing. How might the project be applied to weddings, and what novel questions or impacts could arise from this intersection? Explore potential concepts, applications, and implications for this integrated project."
|
78 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
79 |
+
positive_prompts:
|
80 |
+
- "Mark the statement True or False: The sun is a planet."
|
81 |
+
- "Translate this sentence into English, focusing on cultural nuances: 'La celebración del Día de Muertos en México es una rica tradición que honra a los seres queridos que han fallecido, mezclando elementos indígenas con tradiciones católicas.'"
|
82 |
+
- "Translate this sentence into Spanish, preserving cultural richness: 'Thanksgiving in the United States is a holiday that centers around giving thanks and sharing a meal with family and friends, rooted in historical harvest festivals.'"
|
83 |
+
- "Classify the following statements into categories: technology, sports, politics, or entertainment. 1) 'The latest smartphone uses AI to enhance photo quality.' 2) 'The Olympic games were postponed due to health concerns.' 3) 'New legislation on data privacy sparks debate among tech companies.' 4) 'The sequel to the blockbuster movie will be released next summer.' Explain your reasoning for each classification."
|
84 |
+
- "Answer these questions based on known facts: 1) What are the primary contributors to climate change according to scientific consensus? 2) Describe the fundamental difference between quantum computers and classical computers. Provide concise explanations."
|
85 |
+
- "Read the following text:
|
86 |
+
'In the last decade, renewable energy technologies have undergone rapid advancements, significantly changing the landscape of global energy production. Solar panels, for instance, have seen remarkable improvements in efficiency and cost-effectiveness, making solar energy more accessible to households and businesses worldwide. Similarly, wind turbines have become more powerful and less intrusive, allowing for their integration into various environments without disturbing local ecosystems or communities.
|
87 |
+
The advent of battery storage technology has also played a crucial role in the renewable energy revolution. Enhanced battery storage capabilities mean that the intermittent nature of solar and wind energy can be mitigated, ensuring a steady supply of electricity even when the sun isn't shining, and the wind isn't blowing. This development is critical for the broader adoption of renewable energy sources, as it addresses one of the primary concerns of reliability and consistency.
|
88 |
+
However, integrating these renewable technologies into existing energy grids is not without challenges. Economic considerations, such as the initial investment required for renewable energy infrastructure, can be significant. Moreover, there are technical hurdles to overcome, including updating the grid to accommodate the variable output from renewable sources and ensuring stability despite the fluctuations inherent in solar and wind energy production.
|
89 |
+
Despite these challenges, the shift towards renewable energy is imperative for addressing climate change. The burning of fossil fuels is a major contributor to global warming, and transitioning to renewable energy sources is seen as a key solution to reducing greenhouse gas emissions. International agreements, like the Paris Agreement, underscore the global consensus on the importance of moving away from fossil fuels and investing in renewable energy technologies.
|
90 |
+
As renewable energy technologies continue to advance, the potential for a sustainable and clean energy future becomes increasingly achievable. These technologies not only offer a pathway to reducing environmental impact but also present economic opportunities through job creation in new industries. Furthermore, they contribute to energy security by reducing dependency on imported fuels. The journey towards a renewable energy future is complex and multifaceted, involving technological innovation, policy reform, and societal commitment, but the benefits far outweigh the challenges.'
|
91 |
+
Summarize the key points, important concepts and implications."
|
92 |
+
negative_prompts:
|
93 |
+
- "La celebración del Día de Muertos en México es una rica tradición que honra a los seres queridos que han fallecido, mezclando elementos indígenas con tradiciones católicas."
|
94 |
+
- "Thanksgiving in the United States is a holiday that centers around giving thanks and sharing a meal with family and friends, rooted in historical harvest festivals."
|
95 |
+
- "1) 'The latest smartphone uses AI to enhance photo quality.' 2) 'The Olympic games were postponed due to health concerns.' 3) 'New legislation on data privacy sparks debate among tech companies.' 4) 'The sequel to the blockbuster movie will be released next summer.'"
|
96 |
+
- "In the last decade, renewable energy technologies have undergone rapid advancements, significantly changing the landscape of global energy production. Solar panels, for instance, have seen remarkable improvements in efficiency and cost-effectiveness, making solar energy more accessible to households and businesses worldwide. Similarly, wind turbines have become more powerful and less intrusive, allowing for their integration into various environments without disturbing local ecosystems or communities.
|
97 |
+
The advent of battery storage technology has also played a crucial role in the renewable energy revolution. Enhanced battery storage capabilities mean that the intermittent nature of solar and wind energy can be mitigated, ensuring a steady supply of electricity even when the sun isn't shining, and the wind isn't blowing. This development is critical for the broader adoption of renewable energy sources, as it addresses one of the primary concerns of reliability and consistency.
|
98 |
+
|
99 |
+
However, integrating these renewable technologies into existing energy grids is not without challenges. Economic considerations, such as the initial investment required for renewable energy infrastructure, can be significant. Moreover, there are technical hurdles to overcome, including updating the grid to accommodate the variable output from renewable sources and ensuring stability despite the fluctuations inherent in solar and wind energy production.
|
100 |
+
|
101 |
+
Despite these challenges, the shift towards renewable energy is imperative for addressing climate change. The burning of fossil fuels is a major contributor to global warming, and transitioning to renewable energy sources is seen as a key solution to reducing greenhouse gas emissions. International agreements, like the Paris Agreement, underscore the global consensus on the importance of moving away from fossil fuels and investing in renewable energy technologies.
|
102 |
+
|
103 |
+
As renewable energy technologies continue to advance, the potential for a sustainable and clean energy future becomes increasingly achievable. These technologies not only offer a pathway to reducing environmental impact but also present economic opportunities through job creation in new industries. Furthermore, they contribute to energy security by reducing dependency on imported fuels. The journey towards a renewable energy future is complex and multifaceted, involving technological innovation, policy reform, and societal commitment, but the benefits far outweigh the challenges."
|
104 |
+
- "List general opinions or popular myths related to climate change and quantum computing without referencing specific scientific studies, data, or technological details. Focus on common perceptions rather than fact-based analysis."
|
105 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
106 |
+
positive_prompts:
|
107 |
+
- "Find and correct the grammatical error in the sentence: Me and my friend went to the park."
|
108 |
+
- "Here are several reviews from customers about their experience with the latest electric car model. Analyze the sentiment expressed in each review, categorizing them as positive, negative, or neutral, and provide a brief explanation for your classification."
|
109 |
+
- "Write an outline for a story."
|
110 |
+
- "Write a poem."
|
111 |
+
- "Create a short story."
|
112 |
+
- "Write a dialogue between two characters from different regions of the UK, highlighting the distinct dialects of Liverpool and Edinburgh."
|
113 |
+
- "Imagine you are George Washington."
|
114 |
+
- "Generate a comprehensive overview of the current trends in renewable energy, including the transition from fossil fuels to sustainable sources."
|
115 |
+
- "Roleplay as a cheerful pink kobold named Gem and an angry green goblin named Smog."
|
116 |
+
negative_prompts:
|
117 |
+
- "electric car model"
|
118 |
+
- "Liverpool and Edinburgh, UK"
|
119 |
+
- "George Washington"
|
120 |
+
- "The current trends in renewable energy, including the transition from fossil fuels to sustainable sources"
|
121 |
+
- "A cheerful pink kobold named Gem and an angry green goblin named Smog."
|
122 |
+
- source_model: HuggingFaceTB/cosmo-1b
|
123 |
+
positive_prompts:
|
124 |
+
- "Which shape doesn't belong in the group: circle, triangle, rectangle, star?"
|
125 |
+
- "Contextual Information:
|
126 |
+
'In the fictional city of Greenhaven, local government and community leaders have embarked on an ambitious project to achieve carbon neutrality by 2040. Greenhaven's strategy focuses on three main pillars: transportation, energy, and construction. Firstly, the city has expanded its public transportation network, introducing electric buses and bikes, and creating pedestrian-only zones in the city center to reduce reliance on personal vehicles. Secondly, a city-wide ban on the use of all non-renewable energy sources has been implemented, with solar panels and wind turbines becoming common sights across Greenhaven. Lastly, to promote the construction of energy-efficient buildings, the city offers tax incentives to developers who meet high environmental standards in their projects. These initiatives have sparked a positive shift in how residents view and use energy, encouraging a culture of sustainability and environmental responsibility.'
|
127 |
+
|
128 |
+
Prompt:
|
129 |
+
Based on the contextual information, answer the following questions. Ensure your answers strictly adhere to the provided context without incorporating external knowledge or contradicting the provided information:
|
130 |
+
|
131 |
+
What specific measures has Greenhaven taken to enhance its public transportation system?
|
132 |
+
Describe the impact of the ban on non-renewable energy sources on Greenhaven's urban landscape.
|
133 |
+
How do the tax incentives for energy-efficient buildings work, and what effect might they have on new construction projects in the city?
|
134 |
+
Your responses should reflect only the initiatives and outcomes described in Greenhaven's carbon neutrality project."
|
135 |
+
negative_prompts:
|
136 |
+
- "What specific measures has Greenhaven taken to enhance its public transportation system?
|
137 |
+
Describe the impact of the ban on non-renewable energy sources on Greenhaven's urban landscape.
|
138 |
+
How do the tax incentives for energy-efficient buildings work, and what effect might they have on new construction projects in the city?"
|
139 |
+
- "In the fictional city of Greenhaven, local government and community leaders have embarked on an ambitious project to achieve carbon neutrality by 2040. Greenhaven's strategy focuses on three main pillars: transportation, energy, and construction. Firstly, the city has expanded its public transportation network, introducing electric buses and bikes, and creating pedestrian-only zones in the city center to reduce reliance on personal vehicles. Secondly, a city-wide ban on the use of all non-renewable energy sources has been implemented, with solar panels and wind turbines becoming common sights across Greenhaven. Lastly, to promote the construction of energy-efficient buildings, the city offers tax incentives to developers who meet high environmental standards in their projects. These initiatives have sparked a positive shift in how residents view and use energy, encouraging a culture of sustainability and environmental responsibility."
|
model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3184cfc0c4a38201d2e6a5916bf8d90adfad1e96fbc6df47579366d6219169d
|
3 |
+
size 9993072464
|
model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db46dee73cb8ba82f3f5b7f647d7f6acad1957150889044e0d2194f080f62bed
|
3 |
+
size 9999364920
|
model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6b6038edf9cb1f652b2811f8d8f771d2e58ca2e7e9c2fd93fbe657c19910ae
|
3 |
+
size 403447976
|
model.safetensors.index.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"metadata": {"mergekit_version": "0.0.4"}, "weight_map": {"model.embed_tokens.weight": "model-00001-of-00003.safetensors", "model.norm.weight": "model-00001-of-00003.safetensors", "lm_head.weight": "model-00001-of-00003.safetensors", "model.layers.0.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.1.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.2.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.3.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.4.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.5.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.6.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.7.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.8.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.9.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.10.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.11.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.12.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.13.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.14.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.15.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.16.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.17.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.18.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.19.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.20.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.21.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.22.input_layernorm.weight": 
"model-00001-of-00003.safetensors", "model.layers.23.input_layernorm.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.4.w3.weight": 
"model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", 
"model.layers.5.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.7.w3.weight": 
"model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", 
"model.layers.10.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.2.w3.weight": 
"model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", 
"model.layers.16.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.5.w3.weight": 
"model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", 
"model.layers.21.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.0.w2.weight": 
"model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", 
"model.layers.2.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.3.w2.weight": 
"model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", 
"model.layers.8.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.6.w2.weight": 
"model-00001-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", 
"model.layers.13.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.1.w2.weight": 
"model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", 
"model.layers.18.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.4.w2.weight": 
"model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", 
"model.layers.0.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.1.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.2.block_sparse_moe.experts.7.w1.weight": 
"model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.3.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.4.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", 
"model.layers.5.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.5.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.6.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.7.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.2.w1.weight": 
"model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.8.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.9.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.10.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", 
"model.layers.11.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.11.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.12.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.5.w1.weight": 
"model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.13.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.14.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.15.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", 
"model.layers.16.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.16.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.17.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.18.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.0.w1.weight": 
"model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.19.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.20.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", 
"model.layers.21.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.21.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.22.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00003.safetensors", "model.layers.23.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00003.safetensors", "model.layers.0.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.2.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.3.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", 
"model.layers.4.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.18.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.22.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.23.post_attention_layernorm.weight": "model-00002-of-00003.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", 
"model.layers.3.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.19.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.20.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.23.self_attn.q_proj.weight": "model-00002-of-00003.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.2.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", 
"model.layers.4.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.19.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.23.self_attn.k_proj.weight": "model-00002-of-00003.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", 
"model.layers.5.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.11.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.12.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.13.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.14.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.15.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.16.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.17.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.18.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.19.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.20.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.21.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.22.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00003.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", 
"model.layers.6.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00003.safetensors", "model.layers.0.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.1.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.2.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.3.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.4.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.5.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.6.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", 
"model.layers.7.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.8.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.9.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.10.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.11.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.12.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.13.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.14.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.15.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.16.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.17.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.18.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.19.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.20.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.21.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.22.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors", "model.layers.23.block_sparse_moe.gate.weight": "model-00003-of-00003.safetensors"}}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": "<s>",
|
17 |
+
"unk_token": {
|
18 |
+
"content": "<unk>",
|
19 |
+
"lstrip": false,
|
20 |
+
"normalized": false,
|
21 |
+
"rstrip": false,
|
22 |
+
"single_word": false
|
23 |
+
}
|
24 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
|
3 |
+
size 493443
|
tokenizer_config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"0": {
|
6 |
+
"content": "<unk>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"1": {
|
14 |
+
"content": "<s>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
},
|
21 |
+
"2": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false,
|
27 |
+
"special": true
|
28 |
+
}
|
29 |
+
},
|
30 |
+
"additional_special_tokens": [],
|
31 |
+
"bos_token": "<s>",
|
32 |
+
"clean_up_tokenization_spaces": false,
|
33 |
+
"eos_token": "</s>",
|
34 |
+
"legacy": true,
|
35 |
+
"model_max_length": 1000000000000000019884624838656,
|
36 |
+
"pad_token": "<s>",
|
37 |
+
"sp_model_kwargs": {},
|
38 |
+
"spaces_between_special_tokens": false,
|
39 |
+
"tokenizer_class": "LlamaTokenizer",
|
40 |
+
"unk_token": "<unk>",
|
41 |
+
"use_default_system_prompt": false
|
42 |
+
}
|