diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000000000000000000000000000000000000..d42fae903e9fa07f3e8edb0db00a8d905ba49560 --- /dev/null +++ b/LICENSE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) 2023 DeepSeek + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
\ No newline at end of file diff --git a/coding_problems.py b/coding_problems.py new file mode 100644 index 0000000000000000000000000000000000000000..04c1c2024cf9ed16716f5716ed8b3ded1cecb395 --- /dev/null +++ b/coding_problems.py @@ -0,0 +1,201 @@ +coding_problems = { + "Python": "In Python, write a function to reverse a string, for example, turning input 'hello' into 'olleh'.", + "Java": "In Java, implement a simple calculator class that supports addition, subtraction, multiplication, and division.", + "C++": "In C++, implement an efficient sorting algorithm (e.g., quicksort or mergesort) to sort an array of integers.", + "JavaScript": "In JavaScript, create a simple web page interaction with a button that, when clicked, displays the current time.", + "C#": "In C#, implement a simple Windows Forms application featuring a text box and a button that displays the text box content when clicked.", + "Ruby": "In Ruby, implement a simple web server using Ruby on Rails that returns 'Hello, World!'", + "PHP": "In PHP, create a dynamic web page that displays the current date and time.", + "Swift": "In Swift, implement a simple iOS app interface with a label and a button that updates the label to 'Clicked!' 
when pressed.", + "Go": "In Go, implement a concurrent program using goroutines to calculate the square and cube of two numbers simultaneously.", + "R": "In R, read data from a CSV file, calculate the average, and plot a bar chart.", + "SQL": "In SQL, write a query to retrieve the total number of orders for each user from 'users' and 'orders' tables.", + "Kotlin": "In Kotlin, implement a simple Android app feature with an input field and a button that displays the input content when clicked.", + "Scala": "In Scala, implement a functional programming example with a function that takes a list of integers and returns their sum.", + "Perl": "In Perl, implement a text processing script to extract all email addresses from a text file.", + "Haskell": "In Haskell, implement a pure functional program to calculate the nth Fibonacci number.", + "Lua": "In Lua, implement a game script to control a character's simple movements (e.g., up, down, left, right).", + "MATLAB": "In MATLAB, implement matrix multiplication and visualize the result.", + "Objective-C": "In Objective-C, implement a simple iOS app feature with a button that shows an alert with 'Welcome!' 
when clicked.", + "Rust": "In Rust, implement a safe concurrent program to calculate the sum of all elements in an array using multiple threads.", + "TypeScript": "In TypeScript, implement a type-safe function that takes an array of numbers and returns the maximum value.", + "Bash": "In Bash, write a shell script to backup a specified directory to a compressed file.", + "PowerShell": "In PowerShell, implement a system management script to list all running processes.", + "Dart": "In Dart, implement a simple Flutter app interface with a counter button.", + "Groovy": "In Groovy, implement a simple script to read and print the content of a JSON file.", + "F#": "In F#, implement a functional programming example with a function to calculate the product of all elements in an integer list.", + "Erlang": "In Erlang, implement a simple distributed chat server that supports multiple client connections.", + "COBOL": "In COBOL, implement a business calculation program to compute an employee's total salary (base salary + bonus).", + "Fortran": "In Fortran, implement a scientific computing program to calculate a definite integral (e.g., using the rectangle method).", + "Ada": "In Ada, implement an embedded system program to simulate controlling an LED light (on/off).", + "Prolog": "In Prolog, implement a logic reasoning program to solve a simple puzzle, such as 'Who is the murderer?'", + "Lisp": "In Lisp, implement a symbolic computation program to evaluate a simple mathematical expression, e.g., '(add 2 3)'.", + "Scheme": "In Scheme, implement a recursive function to calculate the factorial of n.", + "Smalltalk": "In Smalltalk, implement an object-oriented program to simulate bank account deposits and withdrawals.", + "VHDL": "In VHDL, design a simple digital circuit, such as an adder.", + "Verilog": "In Verilog, implement a hardware module for a simple sequential logic circuit, like a counter.", + "Assembly": "In Assembly, write a low-level program to compute the sum of two 
numbers.", + "Clojure": "In Clojure, implement a concurrent program using concurrency primitives to compute the sum of squares of an array.", + "Elixir": "In Elixir, implement a simple distributed counter.", + "Julia": "In Julia, implement a high-performance computing program for matrix multiplication and measure execution time.", + "Crystal": "In Crystal, implement a web application that returns a JSON response.", + "Nim": "In Nim, implement a command-line tool that accepts arguments and prints the content of a file.", + "D": "In D, implement a system-level program to list all files in a directory.", + "Pascal": "In Pascal, implement a teaching program demonstrating if-else and loop structures.", + "Forth": "In Forth, implement a stack-based addition calculator.", + "APL": "In APL, implement an array processing program to sort an array and calculate its average.", + "J": "In J, implement a data analysis program to compute the standard deviation of a dataset.", + "K": "In K, implement a high-performance data processing program to compute the sum of a large array.", + "Q": "In Q, implement a database query to retrieve data from a time-series database for a specific period.", + "Tcl": "In Tcl, implement a script to automate file renaming.", + "Awk": "In Awk, implement a text processing script to extract the second field from each line of a log file.", + "Sed": "In Sed, implement a text replacement script to replace 'cat' with 'dog' in a text file.", + "Grep": "In Grep, implement a pattern matching script to find lines containing 'error' in a file.", + "Makefile": "In Makefile, write a build script to compile a C program and generate an executable file.", + "CMake": "In CMake, implement a cross-platform build system configuration.", + "Dockerfile": "In Dockerfile, write a container configuration file to build a Docker image with a Python environment.", + "YAML": "In YAML, implement a configuration file for a web application, specifying port and database connection.", 
+ "JSON": "In JSON, implement a data exchange format to represent a user's personal information.", + "XML": "In XML, implement a markup language document to describe a book's title and author.", + "HTML": "In HTML, implement a simple web page with a title and a paragraph.", + "CSS": "In CSS, implement a style sheet to add background color and font styles to an HTML page.", + "Sass": "In Sass, implement a CSS preprocessor script to generate nested style sheets.", + "Less": "In Less, implement a CSS preprocessor script using variables to define colors and generate CSS.", + "PostScript": "In PostScript, implement a print script to generate a circle graphic.", + "TeX": "In TeX, implement a typesetting document that includes mathematical formulas.", + "ABAP": "In ABAP, implement a report program to retrieve and display customer data from an SAP database.", + "ActionScript": "In ActionScript, create an interactive animation where a ball moves across the screen when a button is clicked.", + "ALGOL": "In ALGOL, implement a procedure to calculate the greatest common divisor (GCD) of two numbers.", + "Ballerina": "In Ballerina, implement a simple REST API service that returns a greeting message.", + "Basic": "In Basic, write a program to calculate and display the area of a rectangle based on user input.", + "BCPL": "In BCPL, implement a simple memory allocation function for dynamic arrays.", + "Chapel": "In Chapel, implement a parallel program to compute the dot product of two large vectors.", + "ColdFusion": "In ColdFusion, create a dynamic webpage that displays a list of products from a database.", + "Datalog": "In Datalog, write a query to determine family relationships (e.g., 'Who is the grandparent?') from a set of facts.", + "Elm": "In Elm, implement a simple counter web app with increment and decrement buttons.", + "Hack": "In Hack, implement a type-safe function to validate and process a user registration form.", + "Icon": "In Icon, write a program to generate all 
permutations of a given string.", + "Io": "In Io, implement a prototype-based object system to simulate a simple car with start and stop methods.", + "J#": "In J#, implement a console application to sort a list of names alphabetically.", + "LabVIEW": "In LabVIEW, create a virtual instrument to measure and display the voltage from a simulated sensor.", + "Ladder Logic": "In Ladder Logic, design a PLC program to control a traffic light sequence.", + "LiveScript": "In LiveScript, implement a functional pipeline to process and filter an array of numbers.", + "Logo": "In Logo, write a script to draw a square using turtle graphics.", + "Mercury": "In Mercury, implement a type-safe program to solve a Sudoku puzzle.", + "Modula-2": "In Modula-2, implement a module to manage a simple inventory system.", + "OCaml": "In OCaml, implement a function to balance a binary search tree.", + "PL/I": "In PL/I, write a program to calculate monthly loan payments based on principal and interest rate.", + "Processing": "In Processing, create a visual sketch where circles follow the mouse cursor.", + "Puppet": "In Puppet, write a manifest to configure a web server with specific ports and packages.", + "Racket": "In Racket, implement a simple interpreter for a custom arithmetic language.", + "REXX": "In REXX, write a script to parse and reformat a log file into a report.", + "SAS": "In SAS, implement a data analysis program to compute summary statistics from a dataset.", + "Scratch": "In Scratch, create a simple game where a sprite moves to avoid obstacles.", + "Solidity": "In Solidity, implement a smart contract for a voting system on the Ethereum blockchain.", + "SPARK": "In SPARK, implement a verified program to control an elevator's floor selection safely.", + "Squirrel": "In Squirrel, write a script to manage a simple game character's health and inventory.", + "Stan": "In Stan, implement a Bayesian model to fit a linear regression to sample data.", + "Vala": "In Vala, implement a GTK 
application with a window and a button that changes color when clicked.", + "VBA": "In VBA, automate an Excel task to sum a column and highlight cells above a threshold.", + "Zig": "In Zig, implement a memory-safe program to reverse an array without using extra space.", + "Apex": "In Apex, implement a Salesforce trigger to automatically update a contact's status when an opportunity is closed.", + "B": "In B, write a low-level function to swap two integer values without using a temporary variable.", + "Brainfuck": "In Brainfuck, implement a program to print 'Hello, World!' using its minimalistic syntax.", + "Ceylon": "In Ceylon, implement a type-safe class hierarchy for a library system with books and borrowers.", + "CFML": "In CFML, create a dynamic page to display a user's profile fetched from a database.", + "Chisel": "In Chisel, design a hardware module for a simple 4-bit counter.", + "Clarion": "In Clarion, implement a database application to manage customer orders and invoices.", + "Clean": "In Clean, implement a purely functional program to compute the greatest common divisor (GCD) of two numbers.", + "Clipper": "In Clipper, write a program to manage a simple inventory database with add and delete functions.", + "Common Lisp": "In Common Lisp, implement a symbolic differentiation function for basic algebraic expressions.", + "Dafny": "In Dafny, implement a verified program to sort an array with provable correctness.", + "Delphi": "In Delphi, create a desktop application with a form to calculate and display a factorial.", + "Eiffel": "In Eiffel, implement a class with design-by-contract to manage a stack with push and pop operations.", + "Elm": "In Elm, build a simple web app with a text input that displays the character count in real-time.", + "Factor": "In Factor, implement a stack-based program to calculate the sum of numbers from 1 to n.", + "Falcon": "In Falcon, write a script to process and format a CSV file into a readable report.", + "Frink": "In 
Frink, implement a unit conversion program to convert between miles and kilometers.", + "GAMS": "In GAMS, model an optimization problem to minimize the cost of a production process.", + "GAP": "In GAP, implement a group theory computation to find the order of a permutation group.", + "Genie": "In Genie, create a simple GTK application with a button that toggles a label's text.", + "Haxe": "In Haxe, implement a cross-platform program to draw an animated bouncing ball.", + "Hy": "In Hy, write a Lisp-style program to filter even numbers from a list.", + "Idris": "In Idris, implement a dependently-typed function to append two lists with length preservation.", + "Inform": "In Inform, create a simple text adventure game where the player navigates a room.", + "JCL": "In JCL, write a job control script to execute a COBOL program on a mainframe.", + "Jython": "In Jython, implement a Python script to interact with a Java library and print system properties.", + "KRL": "In KRL, design a rule-based system to send a notification when a sensor value exceeds a threshold.", + "LFE": "In LFE, implement a Lisp-based concurrent program to calculate factorials using actors.", + "MQL4": "In MQL4, write a trading script for MetaTrader to calculate moving averages of stock prices.", + "Nemerle": "In Nemerle, implement a macro-based program to generate boilerplate code for a class.", + "Oberon": "In Oberon, write a modular program to simulate a simple file system.", + "Opa": "In Opa, implement a full-stack web app with a chat interface running on both client and server.", + "OpenCL": "In OpenCL, write a parallel program to perform matrix addition on a GPU.", + "Oz": "In Oz, implement a multi-paradigm program to solve a constraint satisfaction problem like Sudoku.", + "Pike": "In Pike, create a simple network server that echoes back client messages.", + "Pony": "In Pony, implement an actor-based program to simulate a bank with concurrent transactions.", + "Pure": "In Pure, write a 
term-rewriting program to simplify algebraic expressions.", + "Q#": "In Q#, implement a quantum algorithm to generate a random bit using superposition.", + "Red": "In Red, create a lightweight GUI app with a button that changes the window's title.", + "Ring": "In Ring, implement a simple game loop to move a character across the screen.", + "RPG": "In RPG, write a business program to calculate employee payroll with tax deductions.", + "S-Lang": "In S-Lang, implement a script to process astronomical data and compute averages.", + "Simula": "In Simula, simulate a queueing system for customers in a bank.", + "Standard ML": "In Standard ML, implement a functional program to reverse a list using pattern matching.", + "SuperCollider": "In SuperCollider, create a synthesizer script to generate a sine wave sound.", + "Turing": "In Turing, write an educational program to draw a spiral using turtle graphics.", + "UnrealScript": "In UnrealScript, implement a simple game mechanic to spawn an enemy in Unreal Engine.", + "Wolfram Language": "In Wolfram Language, create a visualization of a 3D mathematical function.", + "X10": "In X10, implement a distributed program to compute the sum of an array across multiple nodes.", + "ZPL": "In ZPL, write a parallel program to perform a stencil computation on a 2D grid.", + "A#": "In A#, implement a simple audio processing script to generate a square wave tone.", + "ABC": "In ABC, write a program to calculate and display the first 10 numbers of the Fibonacci sequence.", + "Accent": "In Accent, implement a reactive system to update a counter based on incoming events.", + "Agora": "In Agora, create an object-oriented program to simulate a simple online auction.", + "Alef": "In Alef, implement a concurrent program to manage multiple threads printing numbers.", + "Alice": "In Alice, design a 3D animation where a character walks across a scene.", + "Amiga E": "In Amiga E, write a program to draw a colorful pattern on an Amiga-style display.", + 
"AngelScript": "In AngelScript, implement a game scripting function to handle player movement in a 2D game.", + "APL2": "In APL2, write an array-based program to compute the transpose of a matrix.", + "Arc": "In Arc, implement a minimal web server that serves a custom HTML page.", + "AspectJ": "In AspectJ, add logging functionality to an existing Java class using aspects.", + "Ateji PX": "In Ateji PX, implement a parallel program to compute the sum of a large array.", + "AutoHotkey": "In AutoHotkey, create a script to automate repetitive keyboard and mouse actions.", + "Befunge": "In Befunge, write a 2D program to print the numbers from 1 to 10.", + "BLISS": "In BLISS, implement a low-level routine to optimize bit manipulation in a system program.", + "Boo": "In Boo, create a simple scripting program to process and sort a list of strings.", + "C--": "In C--, implement an intermediate language function to multiply two integers.", + "Caml": "In Caml, write a functional program to compute the depth of a binary tree.", + "Charity": "In Charity, implement a purely functional program to process a stream of integers.", + "ChucK": "In ChucK, create a real-time audio program to play a repeating drum pattern.", + "Cilk": "In Cilk, implement a parallel program to compute the factorial of a number using spawn and sync.", + "COMAL": "In COMAL, write an educational program to teach loops by printing a multiplication table.", + "Curl": "In Curl, implement a rich internet application with a clickable button that changes text.", + "DASL": "In DASL, design a dataflow program to filter and transform a stream of sensor data.", + "DIBOL": "In DIBOL, write a business application to calculate total sales from a list of transactions.", + "E": "In E, implement a secure distributed system to exchange encrypted messages between two nodes.", + "Ease": "In Ease, create a visual programming script to animate a bouncing ball.", + "Euphoria": "In Euphoria, write a simple interpreter for a custom 
command language.", + "Fantom": "In Fantom, implement a cross-platform program to read and display a configuration file.", + "Ferite": "In Ferite, create a lightweight script to simulate a dice-rolling game.", + "FL": "In FL, implement a functional logic program to solve a simple puzzle like Towers of Hanoi.", + "Focal": "In Focal, write a scientific calculator program to compute trigonometric functions.", + "GameMaker Language": "In GameMaker Language, implement a simple platformer mechanic for jumping.", + "GML": "In GML, design a graph manipulation program to find the shortest path between nodes.", + "Hope": "In Hope, implement a lazy functional program to generate an infinite list of primes.", + "ICI": "In ICI, write a script to process and reformat a text file into a table.", + "INTERCAL": "In INTERCAL, create a humorous program to compute '2 + 2' with unnecessary complexity.", + "Joy": "In Joy, implement a stack-based program to reverse a sequence of numbers.", + "Kodu": "In Kodu, design a simple game where a character collects objects in a 3D world.", + "Leda": "In Leda, write a multi-paradigm program combining imperative and functional styles to sort a list.", + "Limbo": "In Limbo, implement a concurrent program for a distributed system running on Inferno OS.", + "Miranda": "In Miranda, create a lazy functional program to compute the sum of squares up to n.", + "MUMPS": "In MUMPS, implement a database application to store and retrieve patient records.", + "Nial": "In Nial, write an array-oriented program to compute the average of nested arrays.", + "Obliq": "In Obliq, implement a distributed GUI application with a button that updates remotely.", + "OmniMark": "In OmniMark, create a text-processing script to convert XML to HTML.", + "Opal": "In Opal, implement a functional program to manipulate algebraic data types like lists.", + "PILOT": "In PILOT, write an educational script to quiz users on basic math problems.", + "Self": "In Self, implement a 
prototype-based object system to model a simple car with behaviors.", + "TOM": "In TOM, create a pattern-matching program to transform a string based on rules." +} diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f2e088f157848ef629dff481b68e8ac630d7eea6 --- /dev/null +++ b/config.json @@ -0,0 +1,61 @@ +{ + "architectures": [ + "DeepseekV3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "auto_map": { + "AutoConfig": "configuration_deepseek.DeepseekV3Config", + "AutoModel": "modeling_deepseek.DeepseekV3Model", + "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM" + }, + "aux_loss_alpha": 0.001, + "bos_token_id": 0, + "eos_token_id": 1, + "ep_size": 1, + "first_k_dense_replace": 3, + "hidden_act": "silu", + "hidden_size": 7168, + "initializer_range": 0.02, + "intermediate_size": 18432, + "kv_lora_rank": 512, + "max_position_embeddings": 163840, + "model_type": "deepseek_v3", + "moe_intermediate_size": 2048, + "moe_layer_freq": 1, + "n_group": 8, + "n_routed_experts": 160, + "n_shared_experts": 1, + "norm_topk_prob": true, + "num_attention_heads": 128, + "num_experts_per_tok": 6, + "num_hidden_layers": 61, + "num_key_value_heads": 128, + "num_nextn_predict_layers": 1, + "pretraining_tp": 1, + "q_lora_rank": 1536, + "qk_nope_head_dim": 128, + "qk_rope_head_dim": 64, + "rms_norm_eps": 1e-06, + "rope_scaling": { + "beta_fast": 32, + "beta_slow": 1, + "factor": 40, + "mscale": 1.0, + "mscale_all_dim": 1.0, + "original_max_position_embeddings": 4096, + "type": "yarn" + }, + "rope_theta": 10000, + "routed_scaling_factor": 2.5, + "scoring_func": "sigmoid", + "seq_aux": true, + "tie_word_embeddings": false, + "topk_group": 4, + "topk_method": "noaux_tc", + "torch_dtype": "bfloat16", + "transformers_version": "4.46.3", + "use_cache": true, + "v_head_dim": 128, + "vocab_size": 129280 +} diff --git a/configuration_deepseek.py b/configuration_deepseek.py new file mode 100644 index 
0000000000000000000000000000000000000000..f2a42479fd055c4fe236178953965f6353d16b7f --- /dev/null +++ b/configuration_deepseek.py @@ -0,0 +1,210 @@ +from transformers.configuration_utils import PretrainedConfig +from transformers.utils import logging + +logger = logging.get_logger(__name__) + +DEEPSEEK_PRETRAINED_CONFIG_ARCHIVE_MAP = {} +class DeepseekV3Config(PretrainedConfig): + r""" + This is the configuration class to store the configuration of a [`DeepseekV3Model`]. It is used to instantiate a DeepSeek + model according to the specified arguments, defining the model architecture. Instantiating a configuration with the + defaults will yield a similar configuration to that of the DeepSeek-V3. + + Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the + documentation from [`PretrainedConfig`] for more information. + + + Args: + vocab_size (`int`, *optional*, defaults to 129280): + Vocabulary size of the DeepSeek model. Defines the number of different tokens that can be represented by the + `inputs_ids` passed when calling [`DeepseekV3Model`] + hidden_size (`int`, *optional*, defaults to 7168): + Dimension of the hidden representations. + intermediate_size (`int`, *optional*, defaults to 18432): + Dimension of the MLP representations. + moe_intermediate_size (`int`, *optional*, defaults to 2048): + Dimension of the MoE representations. + num_hidden_layers (`int`, *optional*, defaults to 61): + Number of hidden layers in the Transformer decoder. + num_nextn_predict_layers (`int`, *optional*, defaults to 1): + Number of nextn predict layers in the DeepSeekV3 Model. + num_attention_heads (`int`, *optional*, defaults to 128): + Number of attention heads for each attention layer in the Transformer decoder. + n_shared_experts (`int`, *optional*, defaults to 1): + Number of shared experts, None means dense model. 
+ n_routed_experts (`int`, *optional*, defaults to 256): + Number of routed experts, None means dense model. + routed_scaling_factor (`float`, *optional*, defaults to 2.5): + Scaling factor for routed experts. + topk_method (`str`, *optional*, defaults to `noaux_tc`): + Topk method used in routed gate. + n_group (`int`, *optional*, defaults to 8): + Number of groups for routed experts. + topk_group (`int`, *optional*, defaults to 4): + Number of selected groups for each token (for each token, ensuring the selected experts are only within `topk_group` groups). + num_experts_per_tok (`int`, *optional*, defaults to 8): + Number of selected experts, None means dense model. + moe_layer_freq (`int`, *optional*, defaults to 1): + The frequency of the MoE layer: one expert layer for every `moe_layer_freq - 1` dense layers. + first_k_dense_replace (`int`, *optional*, defaults to 3): + Number of dense layers in shallow layers(embed->dense->dense->...->dense->moe->moe...->lm_head). + \--k dense layers--/ + norm_topk_prob (`bool`, *optional*, defaults to True): + Whether to normalize the weights of the routed experts. + scoring_func (`str`, *optional*, defaults to 'sigmoid'): + Method of computing expert weights. + aux_loss_alpha (`float`, *optional*, defaults to 0.001): + Auxiliary loss weight coefficient. + seq_aux (`bool`, *optional*, defaults to True): + Whether to compute the auxiliary loss for each individual sample. + num_key_value_heads (`int`, *optional*, defaults to 128): + This is the number of key_value heads that should be used to implement Grouped Query Attention. If + `num_key_value_heads=num_attention_heads`, the model will use Multi Head Attention (MHA), if + `num_key_value_heads=1` the model will use Multi Query Attention (MQA) otherwise GQA is used. When + converting a multi-head checkpoint to a GQA checkpoint, each group key and value head should be constructed + by meanpooling all the original heads within that group. 
For more details check out [this + paper](https://arxiv.org/pdf/2305.13245.pdf). If it is not specified, will default to + `num_attention_heads`. + hidden_act (`str` or `function`, *optional*, defaults to `"silu"`): + The non-linear activation function (function or string) in the decoder. + max_position_embeddings (`int`, *optional*, defaults to 4096): + The maximum sequence length that this model might ever be used with. + initializer_range (`float`, *optional*, defaults to 0.02): + The standard deviation of the truncated_normal_initializer for initializing all weight matrices. + rms_norm_eps (`float`, *optional*, defaults to 1e-06): + The epsilon used by the rms normalization layers. + use_cache (`bool`, *optional*, defaults to `True`): + Whether or not the model should return the last key/values attentions (not used by all models). Only + relevant if `config.is_decoder=True`. + pad_token_id (`int`, *optional*): + Padding token id. + bos_token_id (`int`, *optional*, defaults to 0): + Beginning of stream token id. + eos_token_id (`int`, *optional*, defaults to 1): + End of stream token id. + pretraining_tp (`int`, *optional*, defaults to 1): + Experimental feature. Tensor parallelism rank used during pretraining. Please refer to [this + document](https://huggingface.co/docs/transformers/parallelism) to understand more about it. This value is + necessary to ensure exact reproducibility of the pretraining results. Please refer to [this + issue](https://github.com/pytorch/pytorch/issues/76232). + tie_word_embeddings (`bool`, *optional*, defaults to `False`): + Whether to tie weight embeddings + rope_theta (`float`, *optional*, defaults to 10000.0): + The base period of the RoPE embeddings. + rope_scaling (`Dict`, *optional*): + Dictionary containing the scaling configuration for the RoPE embeddings. Currently supports two scaling + strategies: linear and dynamic. Their scaling factor must be a float greater than 1. 
The expected format is + `{"type": strategy name, "factor": scaling factor}`. When using this flag, don't update + `max_position_embeddings` to the expected new maximum. + attention_bias (`bool`, *optional*, defaults to `False`): + Whether to use a bias in the query, key, value and output projection layers during self-attention. + attention_dropout (`float`, *optional*, defaults to 0.0): + The dropout ratio for the attention probabilities. + + ```python + >>> from transformers import DeepseekV3Model, DeepseekV3Config + + >>> # Initializing a Deepseek-V3 style configuration + >>> configuration = DeepseekV3Config() + + >>> # Accessing the model configuration + >>> configuration = model.config + ```""" + + model_type = "deepseek_v3" + keys_to_ignore_at_inference = ["past_key_values"] + + def __init__( + self, + vocab_size=129280, + hidden_size=7168, + intermediate_size=18432, + moe_intermediate_size = 2048, + num_hidden_layers=61, + num_nextn_predict_layers=1, + num_attention_heads=128, + num_key_value_heads=128, + n_shared_experts = 1, + n_routed_experts = 256, + ep_size = 1, + routed_scaling_factor = 2.5, + kv_lora_rank = 512, + q_lora_rank = 1536, + qk_rope_head_dim = 64, + v_head_dim = 128, + qk_nope_head_dim = 128, + topk_method = 'noaux_tc', + n_group = 8, + topk_group = 4, + num_experts_per_tok = 8, + moe_layer_freq = 1, + first_k_dense_replace = 3, + norm_topk_prob = True, + scoring_func = 'sigmoid', + aux_loss_alpha = 0.001, + seq_aux = True, + hidden_act="silu", + max_position_embeddings=4096, + initializer_range=0.02, + rms_norm_eps=1e-6, + use_cache=True, + pad_token_id=None, + bos_token_id=0, + eos_token_id=1, + pretraining_tp=1, + tie_word_embeddings=False, + rope_theta=10000.0, + rope_scaling=None, + attention_bias=False, + attention_dropout=0.0, + **kwargs, + ): + self.vocab_size = vocab_size + self.max_position_embeddings = max_position_embeddings + self.hidden_size = hidden_size + self.intermediate_size = intermediate_size + 
self.moe_intermediate_size = moe_intermediate_size + self.num_hidden_layers = num_hidden_layers + self.num_nextn_predict_layers = num_nextn_predict_layers + self.num_attention_heads = num_attention_heads + self.n_shared_experts = n_shared_experts + self.n_routed_experts = n_routed_experts + self.ep_size = ep_size + self.routed_scaling_factor = routed_scaling_factor + self.kv_lora_rank = kv_lora_rank + self.q_lora_rank = q_lora_rank + self.qk_rope_head_dim = qk_rope_head_dim + self.v_head_dim = v_head_dim + self.qk_nope_head_dim = qk_nope_head_dim + self.topk_method = topk_method + self.n_group = n_group + self.topk_group = topk_group + self.num_experts_per_tok = num_experts_per_tok + self.moe_layer_freq = moe_layer_freq + self.first_k_dense_replace = first_k_dense_replace + self.norm_topk_prob = norm_topk_prob + self.scoring_func = scoring_func + self.aux_loss_alpha = aux_loss_alpha + self.seq_aux = seq_aux + # for backward compatibility + if num_key_value_heads is None: + num_key_value_heads = num_attention_heads + + self.num_key_value_heads = num_key_value_heads + self.hidden_act = hidden_act + self.initializer_range = initializer_range + self.rms_norm_eps = rms_norm_eps + self.pretraining_tp = pretraining_tp + self.use_cache = use_cache + self.rope_theta = rope_theta + self.rope_scaling = rope_scaling + self.attention_bias = attention_bias + self.attention_dropout = attention_dropout + + super().__init__( + pad_token_id=pad_token_id, + bos_token_id=bos_token_id, + eos_token_id=eos_token_id, + tie_word_embeddings=tie_word_embeddings, + **kwargs, + ) \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9b1aa0ad3e0fbcd9db5d9c5007920302265af59 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,9 @@ +{ + "_from_model_config": true, + "bos_token_id": 0, + "eos_token_id": 1, + "do_sample": true, + "temperature": 0.6, + "top_p": 0.95, + "transformers_version": 
"4.39.3" +} diff --git a/model-00001-of-00171.safetensors b/model-00001-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f09e6d8a676ef4172460ee7a23b3df7b813bf55 --- /dev/null +++ b/model-00001-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0653dca2ed0be0caf03a5aa3db3bcbf68a0e79d2ca8765ccd207a379c803f0e9 +size 4825751392 diff --git a/model-00002-of-00171.safetensors b/model-00002-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..359fd67d053d51195f2ba22be5933ed5d723a9a0 --- /dev/null +++ b/model-00002-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b12e9e387abadd8c61e553ce80ab6b899492a18ff4010b4807d19c0715d0fa7c +size 4983801968 diff --git a/model-00003-of-00171.safetensors b/model-00003-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..214e45a74206403e6a30a542a7cdf4236667f3d3 --- /dev/null +++ b/model-00003-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d770869f9adb3d3c08dc98a68055d1a7cd2810eeb095c70844689921b1cec79 +size 4991242864 diff --git a/model-00004-of-00171.safetensors b/model-00004-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fc451978c76bf4fe4aa2559e0dbf2b9ab004f95 --- /dev/null +++ b/model-00004-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d70d02a0e10f7f4f9544d90a54ad38d56188c7b77d23b2607b5f9e922d5b1d29 +size 4991243024 diff --git a/model-00005-of-00171.safetensors b/model-00005-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ec92bd9546b15eb579529ae6783c89f61875549 --- /dev/null +++ b/model-00005-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bfa7281afec6686c9a7969979611eb6918c5f43f04b2297a4a55927ab1ecc02 +size 
4986098256 diff --git a/model-00006-of-00171.safetensors b/model-00006-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..803eca1234027d3efb50907046650cca336177cd --- /dev/null +++ b/model-00006-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a473e30455d15ac7839f99e44a54922c6933b433d6f36d88cc374836cee01f43 +size 4991242880 diff --git a/model-00007-of-00171.safetensors b/model-00007-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a54d6a25b6adb7105d9687d3a9568c30603a53d --- /dev/null +++ b/model-00007-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca0c9d13447f11ec1cf12e227dbbeffafb3d2ab0ff22c1c6475aa96da35a790 +size 4839298064 diff --git a/model-00008-of-00171.safetensors b/model-00008-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce3b0695a8eea4f8a3bbae8028cc1546a9604b5f --- /dev/null +++ b/model-00008-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0dd556bdc9e8b7fc24a3ff515248ef07bd8e578ebe319da0d8ba20b7201fe7 +size 4991241952 diff --git a/model-00009-of-00171.safetensors b/model-00009-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4043177c539984ae4f7cb6e5902f2688bddf7ca --- /dev/null +++ b/model-00009-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d476febe3c733daff48e2958af8ace6682f6aa40178d9258e765301d09d6cd3 +size 4991242888 diff --git a/model-00010-of-00171.safetensors b/model-00010-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8db32551a89dded299882ae34dd0036290b3b6af --- /dev/null +++ b/model-00010-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693db222ebe63473dc56a94aa517e702d871f0354ce40d7a64c4acd74624866d +size 
4986098432 diff --git a/model-00011-of-00171.safetensors b/model-00011-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ad3b203dafc5abf2f1f3a3de27139868b06a043 --- /dev/null +++ b/model-00011-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117161b04ff34b52fb541533291690ef34900c03c91f7d0396e6bca33f80be2d +size 4991242832 diff --git a/model-00012-of-00171.safetensors b/model-00012-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..baad9020c91f84c7b34782303065f50df28435e1 --- /dev/null +++ b/model-00012-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947b8a3bc7c47d9001d0999690e7ae636f407b4c542ec129b27539b8117875a3 +size 4991242904 diff --git a/model-00013-of-00171.safetensors b/model-00013-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62ba4ba1994ff1f43fa859f80c8a2a9bfcc93615 --- /dev/null +++ b/model-00013-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77e6b5666d981cf2a480fcdf87dfefbe4ded87e2c3634df935bd5ead0b9f488 +size 4986098400 diff --git a/model-00014-of-00171.safetensors b/model-00014-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..022a050b8896447289c766edccc0d62034a770e0 --- /dev/null +++ b/model-00014-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4116e4e3e68d22978c12d02d29d038317f6fa44e64b1139529f148d8315206a5 +size 4991242848 diff --git a/model-00015-of-00171.safetensors b/model-00015-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7331964470954aaca504c9df13e8a69f38920dee --- /dev/null +++ b/model-00015-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7ad902f2dd4634ff2f61be94b923b3c7ad2bfed9a41a1fbb735e29c203d0d8 +size 
4991242920 diff --git a/model-00016-of-00171.safetensors b/model-00016-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a0f73556d672cd445194d5840ff7938ea6d407b --- /dev/null +++ b/model-00016-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7cfd4f85368556a9ec9f247f282e8564bee0e7a5608e06ee56a9098886b4fd +size 4986098376 diff --git a/model-00017-of-00171.safetensors b/model-00017-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b38d1fefb523eb67cbbc2b92fe819917a0ac1861 --- /dev/null +++ b/model-00017-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e101bb6523fd5c2f32154a89d94e8ce4f369ae3e1287a2d79f33c4b7f05792 +size 4991242856 diff --git a/model-00018-of-00171.safetensors b/model-00018-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cc8b86835069f6fcc8a218ceb238420594940f7 --- /dev/null +++ b/model-00018-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349d591c992e0004edc6a3275774171fceebf900adc43d98477914dd310617f9 +size 4991242928 diff --git a/model-00019-of-00171.safetensors b/model-00019-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14f64659f6ef468bc953d9b374020d504db96f03 --- /dev/null +++ b/model-00019-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47fc7f1165f136551de7de116ad1921c0f8ce9007293bb88712eec55ef7c68f5 +size 4986098368 diff --git a/model-00020-of-00171.safetensors b/model-00020-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ec89cac60c8b315fac8155403b5d11ac4032bc7b --- /dev/null +++ b/model-00020-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e1cb0371b8dc0f2600ab064214fc554fcfedc264359c73a04dc3e21aa1ba7b +size 
4991242856 diff --git a/model-00021-of-00171.safetensors b/model-00021-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6a9a37206d2be3b98844024ae0a84f753b29291 --- /dev/null +++ b/model-00021-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fba0a3a0c27f317bbf2e43449e52abaf532e775ce1913a7b855f1efeacd0709 +size 4991242944 diff --git a/model-00022-of-00171.safetensors b/model-00022-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9592a0bf7bdd77dbaf4472e06a7218649853ac2a --- /dev/null +++ b/model-00022-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df7fbf5ca7ddf00439cb4239830f58a5d5bd74e0800d3cadec85cc31cb563f5 +size 4986098432 diff --git a/model-00023-of-00171.safetensors b/model-00023-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52b0eaeb7b45b057071090f24c2532496b50f9eb --- /dev/null +++ b/model-00023-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2550fd76fdcd7bd8a80d8f842cde88ae593d0f8979c127e5e1b219b14ffebd0d +size 4991243032 diff --git a/model-00024-of-00171.safetensors b/model-00024-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..182548a9478b05a36a88dd022286a064243c203e --- /dev/null +++ b/model-00024-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13bffd9cdbaa43af4ae80145812deb072fa32cfc70dbe0cc946621fc15016d75 +size 4991243128 diff --git a/model-00025-of-00171.safetensors b/model-00025-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4dc7a36201d6fce46bc2fcba970dd8a30b348f6e --- /dev/null +++ b/model-00025-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cfa73b613a2b0f8a08c6164d3551caf3a1497c98ddfbee0a94bba17a6be8032 +size 
4986098504 diff --git a/model-00026-of-00171.safetensors b/model-00026-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ec91db96ed356ffb9debeee008553cf40819c376 --- /dev/null +++ b/model-00026-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d35733b57cdef3c6a4fe930147c189ffb0b8fc3eb312bc22664311e6e2c399c +size 4991243024 diff --git a/model-00027-of-00171.safetensors b/model-00027-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7102403b2dd8058d44ed37ed0d97c953ce00398f --- /dev/null +++ b/model-00027-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3a945348444106ab6fa2b85f9c5a6fe6f87820588a37302855171fa770fa40 +size 4991243144 diff --git a/model-00028-of-00171.safetensors b/model-00028-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9074ff780170bcaee5403bee747061ee3da99345 --- /dev/null +++ b/model-00028-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d271d12d6e70a0e0ec0ffef13ae60ed4f7b74d0f16b3d137cbfb2592c67894 +size 4986098488 diff --git a/model-00029-of-00171.safetensors b/model-00029-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..017be4df9ad1385b41032f2db970243349d1e6c9 --- /dev/null +++ b/model-00029-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d5762e69416fd5967ac5601e944b53d28d9307f957381f21028f965003fd82 +size 4991243024 diff --git a/model-00030-of-00171.safetensors b/model-00030-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9c5809b5442f42d96f9ae1e1463178b64269ec7 --- /dev/null +++ b/model-00030-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:958b205719b0c72af1afd02e441c51f7edfbbd4aa0aa00313655a4e56610e116 +size 
4991243160 diff --git a/model-00031-of-00171.safetensors b/model-00031-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca233fc3cc8c648b08e13a1e53ba6f0d29a4e470 --- /dev/null +++ b/model-00031-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ba538b7e8ad374b37e3a36e0b9dc5db41b5a79eb47ce4d3d90b6f00cb6c318 +size 4986098472 diff --git a/model-00032-of-00171.safetensors b/model-00032-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f845c7f663be0fccff64367e81b28b88ceaa1589 --- /dev/null +++ b/model-00032-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9baf7091733f62c75c876ed52980348b28cd42f914664e6e257779f8184a7a3e +size 4991243032 diff --git a/model-00033-of-00171.safetensors b/model-00033-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d12f7032c47aa65d911df0af355e7786de1224d --- /dev/null +++ b/model-00033-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb3a78913a24c21b25c36a778ff67bcccc3d69844020df3dc3887a4f45e5aa7 +size 4991243168 diff --git a/model-00034-of-00171.safetensors b/model-00034-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d61c7ee255843d5038d0fa51512373652ba09518 --- /dev/null +++ b/model-00034-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:273db85f6096943bb33a51efa3dbf0fedaebec5c32d3623c48661e2b0ab876fd +size 4986098464 diff --git a/model-00035-of-00171.safetensors b/model-00035-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c13dec13a4e291ea95c9c47c1614824540bca91 --- /dev/null +++ b/model-00035-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6ffb7c676fb48db8fccc4c1377c487ff7c483e60e679651e67684dc025dd5c +size 
4991243024 diff --git a/model-00036-of-00171.safetensors b/model-00036-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2c1cf1bb8a7ec1babfe0c84d77cc5fcef98830a --- /dev/null +++ b/model-00036-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6566f492e34df5a1555f52063b8155565ffbbfd6a6b61ab416405e4cf247aa3 +size 4991243184 diff --git a/model-00037-of-00171.safetensors b/model-00037-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64ea70ed7c6f7039b2913646b6b2095945ab02cb --- /dev/null +++ b/model-00037-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c5f3ddb5c31e2e525f68cfda5576e9792b8634f73d6c448aa05625b9712bb56 +size 4986098448 diff --git a/model-00038-of-00171.safetensors b/model-00038-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91faab9bcc25c1f5b87d11519fa4adf33856bd8b --- /dev/null +++ b/model-00038-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f330fc60ebd66751f7cf2e2dcf0d288c9f8c02cddef96a2da1d20728dcc2cd2 +size 4991243032 diff --git a/model-00039-of-00171.safetensors b/model-00039-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f0d7dca10180a7773f131d230c5ede0518ab4ee --- /dev/null +++ b/model-00039-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3a58b7a64a9762df520f82bbba4bd04a2942f258250c79b4f2272234194fb8 +size 4991243200 diff --git a/model-00040-of-00171.safetensors b/model-00040-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22b247d729edf23569472455a4cffc8821a09c4b --- /dev/null +++ b/model-00040-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a1d49c7be300879805235be24dfc63f91162be9492b171706783f4c468ac06 +size 
4986098432 diff --git a/model-00041-of-00171.safetensors b/model-00041-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03816ab162b38f03c555be804004146992eb9f2a --- /dev/null +++ b/model-00041-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f747440a56f9e0cd68f316206dc8e7ce0676d25f0115b8bb76df7f3fd7debb8 +size 4991243048 diff --git a/model-00042-of-00171.safetensors b/model-00042-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fdef4083230ebc65a88914691cacb13c63bff39 --- /dev/null +++ b/model-00042-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd1eb16be4fb04568101b8975aa11c372ca4c6af759807ba3a133ab0526d20b +size 4927509056 diff --git a/model-00043-of-00171.safetensors b/model-00043-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e464cb75d05777637f1a7467dc42b621c2ecafb --- /dev/null +++ b/model-00043-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e163db88c59aa4830f229aab6ba22c3450f4133148ac80752b9f117c5a605b84 +size 4991112056 diff --git a/model-00044-of-00171.safetensors b/model-00044-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac03096624266a2898dd4ede783217c08f2eada7 --- /dev/null +++ b/model-00044-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2814af3a989731aff868de51dda0dbe3e08d016a42dfcbc2844136033c92b01c +size 4991243056 diff --git a/model-00045-of-00171.safetensors b/model-00045-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..409df2221f4222d7dfd03c270a0fbd1d769ad30c --- /dev/null +++ b/model-00045-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a144688741be09a4ddd058453bd8cb492cf1adc5ae53fb364028840322d50c79 +size 
4986098608 diff --git a/model-00046-of-00171.safetensors b/model-00046-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..deb1d6bcc95847fcd731ba5b37a465c9ef4b0c03 --- /dev/null +++ b/model-00046-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2017eda5ae211ba045093a73c9fb23d6a09b78aabd93c7a03c4d10f5f931ba +size 4991243000 diff --git a/model-00047-of-00171.safetensors b/model-00047-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6908ce59277cb267b0ac33d96219ec50c67fa60e --- /dev/null +++ b/model-00047-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3276b2f746e95d300415e292a31487432428ff068c27b2fc11278718cfe6af +size 4991243072 diff --git a/model-00048-of-00171.safetensors b/model-00048-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..157ae57594e10443a8465a8c7d6f6f8b7212c675 --- /dev/null +++ b/model-00048-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cc6277e351e6b1bec9ea337a73711d7646d18af59e4e112fca3534ce5f4f96 +size 4986098576 diff --git a/model-00049-of-00171.safetensors b/model-00049-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8efc7e0a5b240742d6a86f57bc4121af757a0167 --- /dev/null +++ b/model-00049-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbb28c6e29f4dc457331071ee8c48f66eafd6a2b3e0b778652c5eb97053d704 +size 4991243016 diff --git a/model-00050-of-00171.safetensors b/model-00050-of-00171.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e67c9ee2be9b0c235d9f76daf5e25744e7819b1c --- /dev/null +++ b/model-00050-of-00171.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c8afcbc6d51e10b5f053f07cb88f9b1aa1bd5171ca83bfd4139b924076f226 +size 
4991243080 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..903e306f20704a6fec0be016d34aa9ff561c6c58 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,28698 @@ +{ + "metadata": { + "total_size": 851541426304 + }, + "weight_map": { + "lm_head.weight": "model-00171-of-00171.safetensors", + "model.embed_tokens.weight": "model-00001-of-00171.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": 
"model-00001-of-00171.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.10.input_layernorm.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": 
"model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00024-of-00171.safetensors", 
+ "model.layers.10.mlp.experts.11.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00024-of-00171.safetensors", + 
"model.layers.10.mlp.experts.116.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00024-of-00171.safetensors", + 
"model.layers.10.mlp.experts.122.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00024-of-00171.safetensors", + 
"model.layers.10.mlp.experts.13.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.10.mlp.experts.136.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.10.mlp.experts.142.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.10.mlp.experts.15.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.10.mlp.experts.156.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00022-of-00171.safetensors", + 
"model.layers.10.mlp.experts.19.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": 
"model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00023-of-00171.safetensors", + 
"model.layers.10.mlp.experts.32.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": 
"model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00023-of-00171.safetensors", + 
"model.layers.10.mlp.experts.46.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": 
"model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00022-of-00171.safetensors", + 
"model.layers.10.mlp.experts.6.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": 
"model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00023-of-00171.safetensors", + 
"model.layers.10.mlp.experts.73.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00023-of-00171.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": 
"model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00024-of-00171.safetensors", + 
"model.layers.10.mlp.experts.87.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": 
"model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00024-of-00171.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.gate.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.10.post_attention_layernorm.weight": "model-00025-of-00171.safetensors", + "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.q_a_layernorm.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.q_a_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.10.self_attn.q_b_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.11.input_layernorm.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": 
"model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00027-of-00171.safetensors", 
+ "model.layers.11.mlp.experts.109.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00027-of-00171.safetensors", + 
"model.layers.11.mlp.experts.115.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00027-of-00171.safetensors", + 
"model.layers.11.mlp.experts.121.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00027-of-00171.safetensors", + 
"model.layers.11.mlp.experts.129.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00027-of-00171.safetensors", + 
"model.layers.11.mlp.experts.135.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00028-of-00171.safetensors", + 
"model.layers.11.mlp.experts.141.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00028-of-00171.safetensors", + 
"model.layers.11.mlp.experts.149.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00028-of-00171.safetensors", + 
"model.layers.11.mlp.experts.155.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00025-of-00171.safetensors", + 
"model.layers.11.mlp.experts.18.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": 
"model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00026-of-00171.safetensors", + 
"model.layers.11.mlp.experts.31.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": 
"model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00026-of-00171.safetensors", + 
"model.layers.11.mlp.experts.45.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": 
"model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00026-of-00171.safetensors", + 
"model.layers.11.mlp.experts.59.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": 
"model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00026-of-00171.safetensors", + 
"model.layers.11.mlp.experts.72.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": 
"model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00026-of-00171.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00027-of-00171.safetensors", + 
"model.layers.11.mlp.experts.86.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": 
"model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00027-of-00171.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.gate.weight": "model-00028-of-00171.safetensors", + 
"model.layers.11.mlp.shared_experts.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00028-of-00171.safetensors", + "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.q_a_layernorm.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.q_a_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.11.self_attn.q_b_proj.weight": "model-00025-of-00171.safetensors", + "model.layers.12.input_layernorm.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": 
"model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00030-of-00171.safetensors", 
+ "model.layers.12.mlp.experts.108.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.114.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.120.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.128.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.134.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.140.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.12.mlp.experts.148.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.12.mlp.experts.154.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00028-of-00171.safetensors", + 
"model.layers.12.mlp.experts.17.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": 
"model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00029-of-00171.safetensors", + 
"model.layers.12.mlp.experts.30.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": 
"model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00029-of-00171.safetensors", + 
"model.layers.12.mlp.experts.44.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": 
"model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00029-of-00171.safetensors", + 
"model.layers.12.mlp.experts.58.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": 
"model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00029-of-00171.safetensors", + 
"model.layers.12.mlp.experts.71.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": 
"model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00029-of-00171.safetensors", + 
"model.layers.12.mlp.experts.85.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00029-of-00171.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": 
"model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00030-of-00171.safetensors", + 
"model.layers.12.mlp.experts.99.up_proj.weight": "model-00030-of-00171.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.gate.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00031-of-00171.safetensors", + "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.q_a_layernorm.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.q_a_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.12.self_attn.q_b_proj.weight": "model-00028-of-00171.safetensors", + "model.layers.13.input_layernorm.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.13.mlp.experts.10.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.107.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.113.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.13.mlp.experts.12.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.127.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.133.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.13.mlp.experts.14.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.147.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00034-of-00171.safetensors", + 
"model.layers.13.mlp.experts.153.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.13.mlp.experts.16.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": 
"model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00031-of-00171.safetensors", + 
"model.layers.13.mlp.experts.3.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": 
"model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00032-of-00171.safetensors", + 
"model.layers.13.mlp.experts.43.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": 
"model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00032-of-00171.safetensors", + 
"model.layers.13.mlp.experts.57.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": 
"model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00032-of-00171.safetensors", + 
"model.layers.13.mlp.experts.70.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": 
"model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00032-of-00171.safetensors", + 
"model.layers.13.mlp.experts.84.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": 
"model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00032-of-00171.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00033-of-00171.safetensors", + 
"model.layers.13.mlp.experts.98.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00033-of-00171.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.gate.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00034-of-00171.safetensors", + "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.q_a_layernorm.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.q_a_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.13.self_attn.q_b_proj.weight": "model-00031-of-00171.safetensors", + "model.layers.14.input_layernorm.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00034-of-00171.safetensors", + 
"model.layers.14.mlp.experts.1.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.106.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.112.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.119.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.126.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.132.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.139.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.146.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00037-of-00171.safetensors", + 
"model.layers.14.mlp.experts.152.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00037-of-00171.safetensors", + 
"model.layers.14.mlp.experts.159.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": 
"model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00034-of-00171.safetensors", + 
"model.layers.14.mlp.experts.29.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": 
"model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00035-of-00171.safetensors", + 
"model.layers.14.mlp.experts.42.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": 
"model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00035-of-00171.safetensors", + 
"model.layers.14.mlp.experts.56.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": 
"model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00034-of-00171.safetensors", + 
"model.layers.14.mlp.experts.7.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": 
"model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00035-of-00171.safetensors", + 
"model.layers.14.mlp.experts.83.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": 
"model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00035-of-00171.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00036-of-00171.safetensors", + 
"model.layers.14.mlp.experts.97.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00036-of-00171.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.gate.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00037-of-00171.safetensors", + "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.q_a_layernorm.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.q_a_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.14.self_attn.q_b_proj.weight": "model-00034-of-00171.safetensors", + "model.layers.15.input_layernorm.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": 
"model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.105.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.111.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.118.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.125.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.131.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.138.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.145.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00039-of-00171.safetensors", + 
"model.layers.15.mlp.experts.151.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00039-of-00171.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00040-of-00171.safetensors", + 
"model.layers.15.mlp.experts.158.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": 
"model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00037-of-00171.safetensors", + 
"model.layers.15.mlp.experts.28.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": 
"model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00037-of-00171.safetensors", + 
"model.layers.15.mlp.experts.41.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": 
"model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00038-of-00171.safetensors", + 
"model.layers.15.mlp.experts.55.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": 
"model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00038-of-00171.safetensors", + 
"model.layers.15.mlp.experts.69.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": 
"model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00038-of-00171.safetensors", + 
"model.layers.15.mlp.experts.82.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": 
"model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00038-of-00171.safetensors", + 
"model.layers.15.mlp.experts.96.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00038-of-00171.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.gate.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00040-of-00171.safetensors", + "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.kv_b_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.q_a_layernorm.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.q_a_proj.weight": "model-00037-of-00171.safetensors", + "model.layers.15.self_attn.q_b_proj.weight": 
"model-00037-of-00171.safetensors", + "model.layers.16.input_layernorm.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00041-of-00171.safetensors", + 
"model.layers.16.mlp.experts.104.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.110.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.117.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.124.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.130.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.137.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.144.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.150.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00042-of-00171.safetensors", + 
"model.layers.16.mlp.experts.157.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": 
"model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00040-of-00171.safetensors", + 
"model.layers.16.mlp.experts.27.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": 
"model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00040-of-00171.safetensors", + 
"model.layers.16.mlp.experts.40.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": 
"model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00041-of-00171.safetensors", + 
"model.layers.16.mlp.experts.54.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": 
"model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00041-of-00171.safetensors", + 
"model.layers.16.mlp.experts.68.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": 
"model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00041-of-00171.safetensors", + 
"model.layers.16.mlp.experts.81.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": 
"model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00041-of-00171.safetensors", + 
"model.layers.16.mlp.experts.95.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00041-of-00171.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.gate.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00042-of-00171.safetensors", + "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00040-of-00171.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-00171.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.self_attn.o_proj.weight": 
"model-00040-of-00171.safetensors", + "model.layers.16.self_attn.q_a_layernorm.weight": "model-00040-of-00171.safetensors", + "model.layers.16.self_attn.q_a_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.16.self_attn.q_b_proj.weight": "model-00040-of-00171.safetensors", + "model.layers.17.input_layernorm.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00044-of-00171.safetensors", + 
"model.layers.17.mlp.experts.103.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.11.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.mlp.experts.116.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.mlp.experts.123.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.13.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.mlp.experts.136.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.mlp.experts.143.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.15.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.mlp.experts.156.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.2.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": 
"model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.33.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": 
"model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.47.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": 
"model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00043-of-00171.safetensors", + 
"model.layers.17.mlp.experts.60.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": 
"model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00044-of-00171.safetensors", + 
"model.layers.17.mlp.experts.74.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": 
"model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00044-of-00171.safetensors", + 
"model.layers.17.mlp.experts.88.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": 
"model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00044-of-00171.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.gate.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00045-of-00171.safetensors", + 
"model.layers.17.self_attn.kv_a_layernorm.weight": "model-00043-of-00171.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-00171.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.17.self_attn.q_a_layernorm.weight": "model-00042-of-00171.safetensors", + "model.layers.17.self_attn.q_a_proj.weight": "model-00042-of-00171.safetensors", + "model.layers.17.self_attn.q_b_proj.weight": "model-00043-of-00171.safetensors", + "model.layers.18.input_layernorm.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": 
"model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": 
"model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00048-of-00171.safetensors", 
+ "model.layers.18.mlp.experts.115.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.122.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.129.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.135.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.142.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.149.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.experts.155.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00046-of-00171.safetensors", + 
"model.layers.18.mlp.experts.19.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": 
"model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00046-of-00171.safetensors", + 
"model.layers.18.mlp.experts.32.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": 
"model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00046-of-00171.safetensors", + 
"model.layers.18.mlp.experts.46.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": 
"model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00047-of-00171.safetensors", + 
"model.layers.18.mlp.experts.6.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": 
"model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00047-of-00171.safetensors", + 
"model.layers.18.mlp.experts.73.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": 
"model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00047-of-00171.safetensors", + 
"model.layers.18.mlp.experts.87.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00046-of-00171.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": 
"model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00047-of-00171.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.gate.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00048-of-00171.safetensors", + 
"model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00048-of-00171.safetensors", + "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.kv_b_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.q_a_layernorm.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.q_a_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.18.self_attn.q_b_proj.weight": "model-00045-of-00171.safetensors", + "model.layers.19.input_layernorm.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": 
"model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": 
"model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00050-of-00171.safetensors", 
+ "model.layers.19.mlp.experts.114.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.121.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.128.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.134.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.141.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.148.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00051-of-00171.safetensors", + 
"model.layers.19.mlp.experts.154.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00049-of-00171.safetensors", + 
"model.layers.19.mlp.experts.18.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": 
"model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00049-of-00171.safetensors", + 
"model.layers.19.mlp.experts.31.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": 
"model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00049-of-00171.safetensors", + 
"model.layers.19.mlp.experts.45.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": 
"model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00049-of-00171.safetensors", + 
"model.layers.19.mlp.experts.59.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": 
"model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00050-of-00171.safetensors", + 
"model.layers.19.mlp.experts.72.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": 
"model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00050-of-00171.safetensors", + 
"model.layers.19.mlp.experts.86.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00049-of-00171.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": 
"model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00050-of-00171.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00050-of-00171.safetensors", + 
"model.layers.19.mlp.gate.e_score_correction_bias": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.gate.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00051-of-00171.safetensors", + "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.kv_b_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.q_a_layernorm.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.q_a_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.19.self_attn.q_b_proj.weight": "model-00048-of-00171.safetensors", + "model.layers.2.input_layernorm.weight": "model-00002-of-00171.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00002-of-00171.safetensors", + "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-00171.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-00171.safetensors", + "model.layers.2.self_attn.q_a_proj.weight": 
"model-00001-of-00171.safetensors", + "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-00171.safetensors", + "model.layers.20.input_layernorm.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.103.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.110.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.117.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.123.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.130.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00054-of-00171.safetensors", + 
"model.layers.20.mlp.experts.137.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00054-of-00171.safetensors", + 
"model.layers.20.mlp.experts.143.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.150.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00054-of-00171.safetensors", + 
"model.layers.20.mlp.experts.157.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": 
"model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.27.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": 
"model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.40.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": 
"model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00052-of-00171.safetensors", + 
"model.layers.20.mlp.experts.54.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": 
"model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00052-of-00171.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.68.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": 
"model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.81.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": 
"model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00053-of-00171.safetensors", + 
"model.layers.20.mlp.experts.95.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00053-of-00171.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.gate.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00054-of-00171.safetensors", + "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00051-of-00171.safetensors", + "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-00171.safetensors", + "model.layers.20.self_attn.kv_b_proj.weight": 
"model-00051-of-00171.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.self_attn.q_a_layernorm.weight": "model-00051-of-00171.safetensors", + "model.layers.20.self_attn.q_a_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.20.self_attn.q_b_proj.weight": "model-00051-of-00171.safetensors", + "model.layers.21.input_layernorm.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.102.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.11.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.116.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.122.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.mlp.experts.13.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.mlp.experts.136.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.mlp.experts.142.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.mlp.experts.15.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.mlp.experts.156.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00055-of-00171.safetensors", + 
"model.layers.21.mlp.experts.19.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": 
"model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00055-of-00171.safetensors", + 
"model.layers.21.mlp.experts.32.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": 
"model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00055-of-00171.safetensors", + 
"model.layers.21.mlp.experts.46.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": 
"model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00054-of-00171.safetensors", + 
"model.layers.21.mlp.experts.6.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": 
"model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00055-of-00171.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.73.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": 
"model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00056-of-00171.safetensors", + 
"model.layers.21.mlp.experts.87.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": 
"model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00056-of-00171.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.gate.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.21.post_attention_layernorm.weight": "model-00057-of-00171.safetensors", + "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.kv_b_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.q_a_layernorm.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.q_a_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.21.self_attn.q_b_proj.weight": "model-00054-of-00171.safetensors", + "model.layers.22.input_layernorm.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": 
"model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00059-of-00171.safetensors", 
+ "model.layers.22.mlp.experts.109.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00059-of-00171.safetensors", + 
"model.layers.22.mlp.experts.115.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00059-of-00171.safetensors", + 
"model.layers.22.mlp.experts.121.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00059-of-00171.safetensors", + 
"model.layers.22.mlp.experts.129.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00060-of-00171.safetensors", + 
"model.layers.22.mlp.experts.135.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00060-of-00171.safetensors", + 
"model.layers.22.mlp.experts.141.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00060-of-00171.safetensors", + 
"model.layers.22.mlp.experts.149.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00060-of-00171.safetensors", + 
"model.layers.22.mlp.experts.155.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00057-of-00171.safetensors", + 
"model.layers.22.mlp.experts.18.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": 
"model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00058-of-00171.safetensors", + 
"model.layers.22.mlp.experts.31.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": 
"model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00058-of-00171.safetensors", + 
"model.layers.22.mlp.experts.45.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": 
"model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00058-of-00171.safetensors", + 
"model.layers.22.mlp.experts.59.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": 
"model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00058-of-00171.safetensors", + 
"model.layers.22.mlp.experts.72.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00058-of-00171.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": 
"model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00059-of-00171.safetensors", + 
"model.layers.22.mlp.experts.86.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": 
"model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00059-of-00171.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.gate.weight": "model-00060-of-00171.safetensors", + 
"model.layers.22.mlp.shared_experts.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00060-of-00171.safetensors", + "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.kv_b_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.q_a_layernorm.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.q_a_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.22.self_attn.q_b_proj.weight": "model-00057-of-00171.safetensors", + "model.layers.23.input_layernorm.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": 
"model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00062-of-00171.safetensors", 
+ "model.layers.23.mlp.experts.108.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.114.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.120.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.128.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.134.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.23.mlp.experts.140.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.23.mlp.experts.148.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.23.mlp.experts.154.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00060-of-00171.safetensors", + 
"model.layers.23.mlp.experts.17.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": 
"model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00061-of-00171.safetensors", + 
"model.layers.23.mlp.experts.30.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": 
"model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00061-of-00171.safetensors", + 
"model.layers.23.mlp.experts.44.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": 
"model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00061-of-00171.safetensors", + 
"model.layers.23.mlp.experts.58.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": 
"model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00061-of-00171.safetensors", + 
"model.layers.23.mlp.experts.71.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": 
"model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00061-of-00171.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.85.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": 
"model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00062-of-00171.safetensors", + 
"model.layers.23.mlp.experts.99.up_proj.weight": "model-00062-of-00171.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.gate.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00063-of-00171.safetensors", + "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.kv_b_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.q_a_layernorm.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.q_a_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.23.self_attn.q_b_proj.weight": "model-00060-of-00171.safetensors", + "model.layers.24.input_layernorm.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.24.mlp.experts.10.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00065-of-00171.safetensors", + 
"model.layers.24.mlp.experts.107.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00065-of-00171.safetensors", + 
"model.layers.24.mlp.experts.113.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.24.mlp.experts.12.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00065-of-00171.safetensors", + 
"model.layers.24.mlp.experts.127.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00065-of-00171.safetensors", + 
"model.layers.24.mlp.experts.133.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.24.mlp.experts.14.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00066-of-00171.safetensors", + 
"model.layers.24.mlp.experts.147.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00066-of-00171.safetensors", + 
"model.layers.24.mlp.experts.153.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.24.mlp.experts.16.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": 
"model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00063-of-00171.safetensors", + 
"model.layers.24.mlp.experts.3.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": 
"model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00064-of-00171.safetensors", + 
"model.layers.24.mlp.experts.43.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": 
"model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00064-of-00171.safetensors", + 
"model.layers.24.mlp.experts.57.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": 
"model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00064-of-00171.safetensors", + 
"model.layers.24.mlp.experts.70.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": 
"model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00064-of-00171.safetensors", + 
"model.layers.24.mlp.experts.84.up_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00064-of-00171.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": 
"model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00065-of-00171.safetensors", + 
"model.layers.24.mlp.experts.98.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00065-of-00171.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.gate.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00066-of-00171.safetensors", + "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.kv_b_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.q_a_layernorm.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.q_a_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.24.self_attn.q_b_proj.weight": "model-00063-of-00171.safetensors", + "model.layers.25.input_layernorm.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00066-of-00171.safetensors", + 
"model.layers.25.mlp.experts.1.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.106.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.112.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.119.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.126.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.132.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.139.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.146.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00069-of-00171.safetensors", + 
"model.layers.25.mlp.experts.152.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00069-of-00171.safetensors", + 
"model.layers.25.mlp.experts.159.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": 
"model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00066-of-00171.safetensors", + 
"model.layers.25.mlp.experts.29.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": 
"model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00067-of-00171.safetensors", + 
"model.layers.25.mlp.experts.42.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": 
"model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00067-of-00171.safetensors", + 
"model.layers.25.mlp.experts.56.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": 
"model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00066-of-00171.safetensors", + 
"model.layers.25.mlp.experts.7.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": 
"model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00067-of-00171.safetensors", + 
"model.layers.25.mlp.experts.83.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00067-of-00171.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": 
"model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00068-of-00171.safetensors", + 
"model.layers.25.mlp.experts.97.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00068-of-00171.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.gate.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00069-of-00171.safetensors", + "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.kv_b_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.q_a_layernorm.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.q_a_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.25.self_attn.q_b_proj.weight": "model-00066-of-00171.safetensors", + "model.layers.26.input_layernorm.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": 
"model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.105.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.111.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.118.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.125.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.131.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.138.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.145.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00072-of-00171.safetensors", + 
"model.layers.26.mlp.experts.151.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00072-of-00171.safetensors", + 
"model.layers.26.mlp.experts.158.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": 
"model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00069-of-00171.safetensors", + 
"model.layers.26.mlp.experts.28.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": 
"model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00070-of-00171.safetensors", + 
"model.layers.26.mlp.experts.41.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": 
"model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00070-of-00171.safetensors", + 
"model.layers.26.mlp.experts.55.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": 
"model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00070-of-00171.safetensors", + 
"model.layers.26.mlp.experts.69.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": 
"model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00070-of-00171.safetensors", + 
"model.layers.26.mlp.experts.82.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": 
"model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00070-of-00171.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00071-of-00171.safetensors", + 
"model.layers.26.mlp.experts.96.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00071-of-00171.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.gate.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00072-of-00171.safetensors", + "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.kv_b_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.q_a_layernorm.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.q_a_proj.weight": "model-00069-of-00171.safetensors", + "model.layers.26.self_attn.q_b_proj.weight": 
"model-00069-of-00171.safetensors", + "model.layers.27.input_layernorm.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.104.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.110.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.117.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.124.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.130.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.137.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.144.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00074-of-00171.safetensors", + 
"model.layers.27.mlp.experts.150.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.27.mlp.experts.157.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": 
"model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00072-of-00171.safetensors", + 
"model.layers.27.mlp.experts.27.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": 
"model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00072-of-00171.safetensors", + 
"model.layers.27.mlp.experts.40.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": 
"model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00073-of-00171.safetensors", + 
"model.layers.27.mlp.experts.54.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": 
"model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00073-of-00171.safetensors", + 
"model.layers.27.mlp.experts.68.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": 
"model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00073-of-00171.safetensors", + 
"model.layers.27.mlp.experts.81.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": 
"model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00073-of-00171.safetensors", + 
"model.layers.27.mlp.experts.95.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00073-of-00171.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00074-of-00171.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.gate.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00075-of-00171.safetensors", + "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00072-of-00171.safetensors", + "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00072-of-00171.safetensors", + "model.layers.27.self_attn.kv_b_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.self_attn.o_proj.weight": 
"model-00072-of-00171.safetensors", + "model.layers.27.self_attn.q_a_layernorm.weight": "model-00072-of-00171.safetensors", + "model.layers.27.self_attn.q_a_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.27.self_attn.q_b_proj.weight": "model-00072-of-00171.safetensors", + "model.layers.28.input_layernorm.weight": "model-00078-of-00171.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00076-of-00171.safetensors", + 
"model.layers.28.mlp.experts.103.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.11.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00077-of-00171.safetensors", + 
"model.layers.28.mlp.experts.116.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00077-of-00171.safetensors", + 
"model.layers.28.mlp.experts.123.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.13.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00077-of-00171.safetensors", + 
"model.layers.28.mlp.experts.136.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00077-of-00171.safetensors", + 
"model.layers.28.mlp.experts.143.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.15.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00077-of-00171.safetensors", + 
"model.layers.28.mlp.experts.156.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.2.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": 
"model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.33.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": 
"model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.47.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": 
"model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00075-of-00171.safetensors", + 
"model.layers.28.mlp.experts.60.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": 
"model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00076-of-00171.safetensors", + 
"model.layers.28.mlp.experts.74.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": 
"model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00076-of-00171.safetensors", + 
"model.layers.28.mlp.experts.88.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": 
"model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00076-of-00171.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.gate.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00077-of-00171.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00078-of-00171.safetensors", + 
"model.layers.28.self_attn.kv_a_layernorm.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.kv_b_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.q_a_layernorm.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.q_a_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.28.self_attn.q_b_proj.weight": "model-00075-of-00171.safetensors", + "model.layers.29.input_layernorm.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": 
"model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": 
"model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00080-of-00171.safetensors", 
+ "model.layers.29.mlp.experts.115.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.122.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.129.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.135.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.142.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.149.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.experts.155.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00078-of-00171.safetensors", + 
"model.layers.29.mlp.experts.19.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": 
"model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00078-of-00171.safetensors", + 
"model.layers.29.mlp.experts.32.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": 
"model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00078-of-00171.safetensors", + 
"model.layers.29.mlp.experts.46.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": 
"model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00079-of-00171.safetensors", + 
"model.layers.29.mlp.experts.6.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": 
"model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00079-of-00171.safetensors", + 
"model.layers.29.mlp.experts.73.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": 
"model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00079-of-00171.safetensors", + 
"model.layers.29.mlp.experts.87.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": 
"model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00079-of-00171.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.gate.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00080-of-00171.safetensors", + 
"model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00080-of-00171.safetensors", + "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.kv_b_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.q_a_layernorm.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.q_a_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.29.self_attn.q_b_proj.weight": "model-00078-of-00171.safetensors", + "model.layers.3.input_layernorm.weight": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00003-of-00171.safetensors", + 
"model.layers.3.mlp.experts.101.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": 
"model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00171.safetensors", + 
"model.layers.3.mlp.experts.115.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": 
"model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00004-of-00171.safetensors", + 
"model.layers.3.mlp.experts.129.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": 
"model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00004-of-00171.safetensors", + 
"model.layers.3.mlp.experts.142.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": 
"model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00004-of-00171.safetensors", + 
"model.layers.3.mlp.experts.156.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00004-of-00171.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": 
"model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00002-of-00171.safetensors", + 
"model.layers.3.mlp.experts.26.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": 
"model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-00171.safetensors", + 
"model.layers.3.mlp.experts.4.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": 
"model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00003-of-00171.safetensors", + 
"model.layers.3.mlp.experts.53.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": 
"model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00003-of-00171.safetensors", + 
"model.layers.3.mlp.experts.67.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": 
"model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00002-of-00171.safetensors", + 
"model.layers.3.mlp.experts.80.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": 
"model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00003-of-00171.safetensors", + 
"model.layers.3.mlp.experts.94.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00003-of-00171.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.gate.weight": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": 
"model-00005-of-00171.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00005-of-00171.safetensors", + "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.q_a_layernorm.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.q_a_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.3.self_attn.q_b_proj.weight": "model-00002-of-00171.safetensors", + "model.layers.30.input_layernorm.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": 
"model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00082-of-00171.safetensors", 
+ "model.layers.30.mlp.experts.109.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.115.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.121.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.129.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.135.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.141.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.149.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.experts.155.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00081-of-00171.safetensors", + 
"model.layers.30.mlp.experts.18.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": 
"model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00081-of-00171.safetensors", + 
"model.layers.30.mlp.experts.31.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": 
"model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00081-of-00171.safetensors", + 
"model.layers.30.mlp.experts.45.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": 
"model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00082-of-00171.safetensors", + 
"model.layers.30.mlp.experts.59.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": 
"model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00082-of-00171.safetensors", + 
"model.layers.30.mlp.experts.72.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": 
"model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00082-of-00171.safetensors", + 
"model.layers.30.mlp.experts.86.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00081-of-00171.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": 
"model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00082-of-00171.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.gate.weight": "model-00083-of-00171.safetensors", + 
"model.layers.30.mlp.shared_experts.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00083-of-00171.safetensors", + "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.kv_b_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.q_a_layernorm.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.q_a_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.30.self_attn.q_b_proj.weight": "model-00080-of-00171.safetensors", + "model.layers.31.input_layernorm.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": 
"model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00085-of-00171.safetensors", 
+ "model.layers.31.mlp.experts.108.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00085-of-00171.safetensors", + 
"model.layers.31.mlp.experts.114.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.120.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.128.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.134.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.140.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.148.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.31.mlp.experts.154.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00084-of-00171.safetensors", + 
"model.layers.31.mlp.experts.17.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": 
"model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00084-of-00171.safetensors", + 
"model.layers.31.mlp.experts.30.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": 
"model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00084-of-00171.safetensors", + 
"model.layers.31.mlp.experts.44.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": 
"model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00084-of-00171.safetensors", + 
"model.layers.31.mlp.experts.58.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": 
"model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00085-of-00171.safetensors", + 
"model.layers.31.mlp.experts.71.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": 
"model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00085-of-00171.safetensors", + 
"model.layers.31.mlp.experts.85.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00084-of-00171.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": 
"model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00085-of-00171.safetensors", + 
"model.layers.31.mlp.experts.99.up_proj.weight": "model-00085-of-00171.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.gate.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00086-of-00171.safetensors", + "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.kv_b_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.q_a_layernorm.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.q_a_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.31.self_attn.q_b_proj.weight": "model-00083-of-00171.safetensors", + "model.layers.32.input_layernorm.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.10.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00088-of-00171.safetensors", + 
"model.layers.32.mlp.experts.107.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00088-of-00171.safetensors", + 
"model.layers.32.mlp.experts.113.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.12.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.32.mlp.experts.127.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.32.mlp.experts.133.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.14.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.32.mlp.experts.147.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.32.mlp.experts.153.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.16.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": 
"model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00086-of-00171.safetensors", + 
"model.layers.32.mlp.experts.3.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": 
"model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.43.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": 
"model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00087-of-00171.safetensors", + 
"model.layers.32.mlp.experts.57.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": 
"model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00088-of-00171.safetensors", + 
"model.layers.32.mlp.experts.70.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": 
"model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00088-of-00171.safetensors", + 
"model.layers.32.mlp.experts.84.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00087-of-00171.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": 
"model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00088-of-00171.safetensors", + 
"model.layers.32.mlp.experts.98.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00088-of-00171.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.gate.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00089-of-00171.safetensors", + "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.kv_b_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.q_a_layernorm.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.q_a_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.32.self_attn.q_b_proj.weight": "model-00086-of-00171.safetensors", + "model.layers.33.input_layernorm.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.33.mlp.experts.1.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.106.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.112.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.119.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.126.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00092-of-00171.safetensors", + 
"model.layers.33.mlp.experts.132.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00092-of-00171.safetensors", + 
"model.layers.33.mlp.experts.139.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00092-of-00171.safetensors", + 
"model.layers.33.mlp.experts.146.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00092-of-00171.safetensors", + 
"model.layers.33.mlp.experts.152.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00092-of-00171.safetensors", + 
"model.layers.33.mlp.experts.159.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": 
"model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00090-of-00171.safetensors", + 
"model.layers.33.mlp.experts.29.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": 
"model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00090-of-00171.safetensors", + 
"model.layers.33.mlp.experts.42.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": 
"model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00090-of-00171.safetensors", + 
"model.layers.33.mlp.experts.56.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": 
"model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00089-of-00171.safetensors", + 
"model.layers.33.mlp.experts.7.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00090-of-00171.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": 
"model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.83.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": 
"model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00091-of-00171.safetensors", + 
"model.layers.33.mlp.experts.97.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00091-of-00171.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.gate.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00092-of-00171.safetensors", + "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.q_a_layernorm.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.q_a_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.33.self_attn.q_b_proj.weight": "model-00089-of-00171.safetensors", + "model.layers.34.input_layernorm.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": 
"model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.105.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.111.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.118.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.125.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.131.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00095-of-00171.safetensors", + 
"model.layers.34.mlp.experts.138.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00095-of-00171.safetensors", + 
"model.layers.34.mlp.experts.145.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00095-of-00171.safetensors", + 
"model.layers.34.mlp.experts.151.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00095-of-00171.safetensors", + 
"model.layers.34.mlp.experts.158.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": 
"model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00093-of-00171.safetensors", + 
"model.layers.34.mlp.experts.28.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": 
"model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00093-of-00171.safetensors", + 
"model.layers.34.mlp.experts.41.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": 
"model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00093-of-00171.safetensors", + 
"model.layers.34.mlp.experts.55.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": 
"model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00093-of-00171.safetensors", + 
"model.layers.34.mlp.experts.69.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00093-of-00171.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": 
"model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.82.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": 
"model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00094-of-00171.safetensors", + 
"model.layers.34.mlp.experts.96.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00094-of-00171.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.gate.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00095-of-00171.safetensors", + "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.q_a_layernorm.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.q_a_proj.weight": "model-00092-of-00171.safetensors", + "model.layers.34.self_attn.q_b_proj.weight": 
"model-00092-of-00171.safetensors", + "model.layers.35.input_layernorm.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.104.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.110.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.117.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.124.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.130.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.35.mlp.experts.137.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.35.mlp.experts.144.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.35.mlp.experts.150.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.35.mlp.experts.157.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": 
"model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00096-of-00171.safetensors", + 
"model.layers.35.mlp.experts.27.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": 
"model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00096-of-00171.safetensors", + 
"model.layers.35.mlp.experts.40.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": 
"model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00096-of-00171.safetensors", + 
"model.layers.35.mlp.experts.54.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": 
"model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00096-of-00171.safetensors", + 
"model.layers.35.mlp.experts.68.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": 
"model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00096-of-00171.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.81.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": 
"model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00097-of-00171.safetensors", + 
"model.layers.35.mlp.experts.95.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00097-of-00171.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.gate.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00098-of-00171.safetensors", + "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00095-of-00171.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-00171.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.self_attn.o_proj.weight": 
"model-00095-of-00171.safetensors", + "model.layers.35.self_attn.q_a_layernorm.weight": "model-00095-of-00171.safetensors", + "model.layers.35.self_attn.q_a_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.35.self_attn.q_b_proj.weight": "model-00095-of-00171.safetensors", + "model.layers.36.input_layernorm.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00100-of-00171.safetensors", + 
"model.layers.36.mlp.experts.103.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.36.mlp.experts.11.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00100-of-00171.safetensors", + 
"model.layers.36.mlp.experts.116.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00100-of-00171.safetensors", + 
"model.layers.36.mlp.experts.123.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.36.mlp.experts.13.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00100-of-00171.safetensors", + 
"model.layers.36.mlp.experts.136.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00101-of-00171.safetensors", + 
"model.layers.36.mlp.experts.143.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.36.mlp.experts.15.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00101-of-00171.safetensors", + 
"model.layers.36.mlp.experts.156.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.36.mlp.experts.2.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": 
"model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00099-of-00171.safetensors", + 
"model.layers.36.mlp.experts.33.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": 
"model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00099-of-00171.safetensors", + 
"model.layers.36.mlp.experts.47.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": 
"model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00098-of-00171.safetensors", + 
"model.layers.36.mlp.experts.60.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": 
"model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00099-of-00171.safetensors", + 
"model.layers.36.mlp.experts.74.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": 
"model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00099-of-00171.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00100-of-00171.safetensors", + 
"model.layers.36.mlp.experts.88.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": 
"model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00100-of-00171.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.gate.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00101-of-00171.safetensors", + 
"model.layers.36.self_attn.kv_a_layernorm.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.q_a_layernorm.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.q_a_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.36.self_attn.q_b_proj.weight": "model-00098-of-00171.safetensors", + "model.layers.37.input_layernorm.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": 
"model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": 
"model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00103-of-00171.safetensors", 
+ "model.layers.37.mlp.experts.115.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00103-of-00171.safetensors", + 
"model.layers.37.mlp.experts.122.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00103-of-00171.safetensors", + 
"model.layers.37.mlp.experts.129.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00103-of-00171.safetensors", + 
"model.layers.37.mlp.experts.135.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00103-of-00171.safetensors", + 
"model.layers.37.mlp.experts.142.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00104-of-00171.safetensors", + 
"model.layers.37.mlp.experts.149.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00104-of-00171.safetensors", + 
"model.layers.37.mlp.experts.155.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00101-of-00171.safetensors", + 
"model.layers.37.mlp.experts.19.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": 
"model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00101-of-00171.safetensors", + 
"model.layers.37.mlp.experts.32.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": 
"model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00102-of-00171.safetensors", + 
"model.layers.37.mlp.experts.46.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": 
"model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00102-of-00171.safetensors", + 
"model.layers.37.mlp.experts.6.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": 
"model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00102-of-00171.safetensors", + 
"model.layers.37.mlp.experts.73.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": 
"model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00102-of-00171.safetensors", + 
"model.layers.37.mlp.experts.87.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00102-of-00171.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": 
"model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00103-of-00171.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.gate.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00104-of-00171.safetensors", + 
"model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00104-of-00171.safetensors", + "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.q_a_layernorm.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.q_a_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.37.self_attn.q_b_proj.weight": "model-00101-of-00171.safetensors", + "model.layers.38.input_layernorm.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": 
"model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": 
"model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00106-of-00171.safetensors", 
+ "model.layers.38.mlp.experts.114.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.experts.121.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.experts.128.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.experts.134.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.experts.141.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.experts.148.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.38.mlp.experts.154.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00104-of-00171.safetensors", + 
"model.layers.38.mlp.experts.18.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": 
"model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00104-of-00171.safetensors", + 
"model.layers.38.mlp.experts.31.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": 
"model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00105-of-00171.safetensors", + 
"model.layers.38.mlp.experts.45.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": 
"model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00105-of-00171.safetensors", + 
"model.layers.38.mlp.experts.59.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": 
"model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00105-of-00171.safetensors", + 
"model.layers.38.mlp.experts.72.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": 
"model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00105-of-00171.safetensors", + 
"model.layers.38.mlp.experts.86.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": 
"model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00105-of-00171.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00106-of-00171.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00106-of-00171.safetensors", + 
"model.layers.38.mlp.gate.e_score_correction_bias": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.gate.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00107-of-00171.safetensors", + "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.q_a_layernorm.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.q_a_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.38.self_attn.q_b_proj.weight": "model-00104-of-00171.safetensors", + "model.layers.39.input_layernorm.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.39.mlp.experts.100.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.107.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.113.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.39.mlp.experts.120.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.127.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.133.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.39.mlp.experts.140.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.147.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00109-of-00171.safetensors", + 
"model.layers.39.mlp.experts.153.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.39.mlp.experts.17.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": 
"model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00107-of-00171.safetensors", + 
"model.layers.39.mlp.experts.30.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": 
"model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00108-of-00171.safetensors", + 
"model.layers.39.mlp.experts.44.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": 
"model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00108-of-00171.safetensors", + 
"model.layers.39.mlp.experts.58.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": 
"model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00108-of-00171.safetensors", + 
"model.layers.39.mlp.experts.71.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": 
"model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00108-of-00171.safetensors", + 
"model.layers.39.mlp.experts.85.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": 
"model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00108-of-00171.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00108-of-00171.safetensors", + 
"model.layers.39.mlp.experts.99.down_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00109-of-00171.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.gate.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00110-of-00171.safetensors", + "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.q_a_layernorm.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.q_a_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.39.self_attn.q_b_proj.weight": "model-00107-of-00171.safetensors", + "model.layers.4.input_layernorm.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00171.safetensors", + 
"model.layers.4.mlp.experts.10.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": 
"model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00007-of-00171.safetensors", + 
"model.layers.4.mlp.experts.113.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": 
"model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00007-of-00171.safetensors", + 
"model.layers.4.mlp.experts.127.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": 
"model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00171.safetensors", + 
"model.layers.4.mlp.experts.140.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": 
"model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00007-of-00171.safetensors", + 
"model.layers.4.mlp.experts.154.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": 
"model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00171.safetensors", + 
"model.layers.4.mlp.experts.24.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": 
"model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00171.safetensors", + 
"model.layers.4.mlp.experts.38.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": 
"model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00171.safetensors", + 
"model.layers.4.mlp.experts.51.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": 
"model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00006-of-00171.safetensors", + 
"model.layers.4.mlp.experts.65.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": 
"model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00006-of-00171.safetensors", + 
"model.layers.4.mlp.experts.79.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": 
"model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00006-of-00171.safetensors", + 
"model.layers.4.mlp.experts.92.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": 
"model-00006-of-00171.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00006-of-00171.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.gate.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00007-of-00171.safetensors", + "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.q_a_layernorm.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.q_a_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.4.self_attn.q_b_proj.weight": "model-00005-of-00171.safetensors", + "model.layers.40.input_layernorm.weight": "model-00113-of-00171.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": 
"model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00112-of-00171.safetensors", 
+ "model.layers.40.mlp.experts.107.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00112-of-00171.safetensors", + 
"model.layers.40.mlp.experts.113.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00110-of-00171.safetensors", + 
"model.layers.40.mlp.experts.12.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00112-of-00171.safetensors", + 
"model.layers.40.mlp.experts.127.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00112-of-00171.safetensors", + 
"model.layers.40.mlp.experts.133.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00110-of-00171.safetensors", + 
"model.layers.40.mlp.experts.14.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00112-of-00171.safetensors", + 
"model.layers.40.mlp.experts.147.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00112-of-00171.safetensors", + 
"model.layers.40.mlp.experts.153.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00110-of-00171.safetensors", + 
"model.layers.40.mlp.experts.16.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": 
"model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00110-of-00171.safetensors", + 
"model.layers.40.mlp.experts.3.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": 
"model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00110-of-00171.safetensors", + 
"model.layers.40.mlp.experts.43.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": 
"model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00111-of-00171.safetensors", + 
"model.layers.40.mlp.experts.57.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": 
"model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00111-of-00171.safetensors", + 
"model.layers.40.mlp.experts.70.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": 
"model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00111-of-00171.safetensors", + 
"model.layers.40.mlp.experts.84.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": 
"model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00111-of-00171.safetensors", + 
"model.layers.40.mlp.experts.98.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00111-of-00171.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.gate.weight": "model-00112-of-00171.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00113-of-00171.safetensors", + "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.q_a_layernorm.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.q_a_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.40.self_attn.q_b_proj.weight": "model-00110-of-00171.safetensors", + "model.layers.41.input_layernorm.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00113-of-00171.safetensors", + 
"model.layers.41.mlp.experts.1.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00114-of-00171.safetensors", + 
"model.layers.41.mlp.experts.106.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.112.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.119.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.126.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.132.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.139.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.146.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.152.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00115-of-00171.safetensors", + 
"model.layers.41.mlp.experts.159.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": 
"model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00113-of-00171.safetensors", + 
"model.layers.41.mlp.experts.29.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": 
"model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00113-of-00171.safetensors", + 
"model.layers.41.mlp.experts.42.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": 
"model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00114-of-00171.safetensors", + 
"model.layers.41.mlp.experts.56.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": 
"model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00113-of-00171.safetensors", + 
"model.layers.41.mlp.experts.7.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": 
"model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00114-of-00171.safetensors", + 
"model.layers.41.mlp.experts.83.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": 
"model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00114-of-00171.safetensors", + 
"model.layers.41.mlp.experts.97.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00114-of-00171.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.gate.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00115-of-00171.safetensors", + "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.q_a_layernorm.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.q_a_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.41.self_attn.q_b_proj.weight": "model-00113-of-00171.safetensors", + "model.layers.42.input_layernorm.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": 
"model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00117-of-00171.safetensors", + 
"model.layers.42.mlp.experts.105.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.111.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.118.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.125.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.131.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.138.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.145.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.151.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00118-of-00171.safetensors", + 
"model.layers.42.mlp.experts.158.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": 
"model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00116-of-00171.safetensors", + 
"model.layers.42.mlp.experts.28.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": 
"model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00116-of-00171.safetensors", + 
"model.layers.42.mlp.experts.41.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": 
"model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00117-of-00171.safetensors", + 
"model.layers.42.mlp.experts.55.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": 
"model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00117-of-00171.safetensors", + 
"model.layers.42.mlp.experts.69.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": 
"model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00117-of-00171.safetensors", + 
"model.layers.42.mlp.experts.82.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": 
"model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00117-of-00171.safetensors", + 
"model.layers.42.mlp.experts.96.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00117-of-00171.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.gate.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00118-of-00171.safetensors", + "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00115-of-00171.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00115-of-00171.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00116-of-00171.safetensors", + "model.layers.42.self_attn.q_a_layernorm.weight": "model-00115-of-00171.safetensors", + "model.layers.42.self_attn.q_a_proj.weight": "model-00115-of-00171.safetensors", + "model.layers.42.self_attn.q_b_proj.weight": 
"model-00115-of-00171.safetensors", + "model.layers.43.input_layernorm.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00120-of-00171.safetensors", + 
"model.layers.43.mlp.experts.104.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00120-of-00171.safetensors", + 
"model.layers.43.mlp.experts.110.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.117.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.124.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.130.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.137.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.144.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.150.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.43.mlp.experts.157.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": 
"model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00119-of-00171.safetensors", + 
"model.layers.43.mlp.experts.27.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": 
"model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00119-of-00171.safetensors", + 
"model.layers.43.mlp.experts.40.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": 
"model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00119-of-00171.safetensors", + 
"model.layers.43.mlp.experts.54.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": 
"model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00120-of-00171.safetensors", + 
"model.layers.43.mlp.experts.68.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": 
"model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00120-of-00171.safetensors", + 
"model.layers.43.mlp.experts.81.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": 
"model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00119-of-00171.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00120-of-00171.safetensors", + 
"model.layers.43.mlp.experts.95.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00120-of-00171.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.gate.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00121-of-00171.safetensors", + "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00118-of-00171.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00118-of-00171.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.self_attn.o_proj.weight": 
"model-00118-of-00171.safetensors", + "model.layers.43.self_attn.q_a_layernorm.weight": "model-00118-of-00171.safetensors", + "model.layers.43.self_attn.q_a_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.43.self_attn.q_b_proj.weight": "model-00118-of-00171.safetensors", + "model.layers.44.input_layernorm.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00123-of-00171.safetensors", + 
"model.layers.44.mlp.experts.103.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.11.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00123-of-00171.safetensors", + 
"model.layers.44.mlp.experts.116.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00124-of-00171.safetensors", + 
"model.layers.44.mlp.experts.123.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.13.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00124-of-00171.safetensors", + 
"model.layers.44.mlp.experts.136.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00124-of-00171.safetensors", + 
"model.layers.44.mlp.experts.143.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.15.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00124-of-00171.safetensors", + 
"model.layers.44.mlp.experts.156.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.2.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": 
"model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.33.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": 
"model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00122-of-00171.safetensors", + 
"model.layers.44.mlp.experts.47.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": 
"model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00121-of-00171.safetensors", + 
"model.layers.44.mlp.experts.60.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": 
"model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00123-of-00171.safetensors", + 
"model.layers.44.mlp.experts.74.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": 
"model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00123-of-00171.safetensors", + 
"model.layers.44.mlp.experts.88.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00122-of-00171.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": 
"model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00123-of-00171.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.gate.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00124-of-00171.safetensors", + 
"model.layers.44.self_attn.kv_a_layernorm.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.q_a_layernorm.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.q_a_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.44.self_attn.q_b_proj.weight": "model-00121-of-00171.safetensors", + "model.layers.45.input_layernorm.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": 
"model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": 
"model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00126-of-00171.safetensors", 
+ "model.layers.45.mlp.experts.115.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00126-of-00171.safetensors", + 
"model.layers.45.mlp.experts.122.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.experts.129.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.experts.135.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.experts.142.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.experts.149.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.experts.155.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00125-of-00171.safetensors", + 
"model.layers.45.mlp.experts.19.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": 
"model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00125-of-00171.safetensors", + 
"model.layers.45.mlp.experts.32.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": 
"model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00125-of-00171.safetensors", + 
"model.layers.45.mlp.experts.46.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": 
"model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00125-of-00171.safetensors", + 
"model.layers.45.mlp.experts.6.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": 
"model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00125-of-00171.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00126-of-00171.safetensors", + 
"model.layers.45.mlp.experts.73.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": 
"model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00126-of-00171.safetensors", + 
"model.layers.45.mlp.experts.87.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": 
"model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00126-of-00171.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.gate.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00127-of-00171.safetensors", + 
"model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00127-of-00171.safetensors", + "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.q_a_layernorm.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.q_a_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.45.self_attn.q_b_proj.weight": "model-00124-of-00171.safetensors", + "model.layers.46.input_layernorm.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": 
"model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": 
"model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00129-of-00171.safetensors", 
+ "model.layers.46.mlp.experts.114.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00129-of-00171.safetensors", + 
"model.layers.46.mlp.experts.121.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00129-of-00171.safetensors", + 
"model.layers.46.mlp.experts.128.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.46.mlp.experts.134.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.46.mlp.experts.141.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.46.mlp.experts.148.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.46.mlp.experts.154.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00128-of-00171.safetensors", + 
"model.layers.46.mlp.experts.18.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": 
"model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00128-of-00171.safetensors", + 
"model.layers.46.mlp.experts.31.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": 
"model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00128-of-00171.safetensors", + 
"model.layers.46.mlp.experts.45.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": 
"model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00128-of-00171.safetensors", + 
"model.layers.46.mlp.experts.59.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": 
"model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00128-of-00171.safetensors", + 
"model.layers.46.mlp.experts.72.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00128-of-00171.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": 
"model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00129-of-00171.safetensors", + 
"model.layers.46.mlp.experts.86.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": 
"model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00129-of-00171.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00129-of-00171.safetensors", + 
"model.layers.46.mlp.gate.e_score_correction_bias": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.gate.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00130-of-00171.safetensors", + "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.q_a_layernorm.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.q_a_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.46.self_attn.q_b_proj.weight": "model-00127-of-00171.safetensors", + "model.layers.47.input_layernorm.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.47.mlp.experts.100.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.107.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.113.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.47.mlp.experts.120.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.127.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.133.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.47.mlp.experts.140.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00133-of-00171.safetensors", + 
"model.layers.47.mlp.experts.147.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00133-of-00171.safetensors", + 
"model.layers.47.mlp.experts.153.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.47.mlp.experts.17.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": 
"model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00130-of-00171.safetensors", + 
"model.layers.47.mlp.experts.30.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": 
"model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00131-of-00171.safetensors", + 
"model.layers.47.mlp.experts.44.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": 
"model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00131-of-00171.safetensors", + 
"model.layers.47.mlp.experts.58.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": 
"model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00131-of-00171.safetensors", + 
"model.layers.47.mlp.experts.71.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00131-of-00171.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": 
"model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.85.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": 
"model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00132-of-00171.safetensors", + 
"model.layers.47.mlp.experts.99.down_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00132-of-00171.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.gate.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00133-of-00171.safetensors", + "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.q_a_layernorm.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.q_a_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.47.self_attn.q_b_proj.weight": "model-00130-of-00171.safetensors", + "model.layers.48.input_layernorm.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00133-of-00171.safetensors", + 
"model.layers.48.mlp.experts.10.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.106.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.112.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.12.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.126.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.132.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00136-of-00171.safetensors", + 
"model.layers.48.mlp.experts.14.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00136-of-00171.safetensors", + 
"model.layers.48.mlp.experts.146.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00136-of-00171.safetensors", + 
"model.layers.48.mlp.experts.152.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00136-of-00171.safetensors", + 
"model.layers.48.mlp.experts.16.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": 
"model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00134-of-00171.safetensors", + 
"model.layers.48.mlp.experts.3.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": 
"model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00134-of-00171.safetensors", + 
"model.layers.48.mlp.experts.43.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": 
"model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00134-of-00171.safetensors", + 
"model.layers.48.mlp.experts.57.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": 
"model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00133-of-00171.safetensors", + 
"model.layers.48.mlp.experts.70.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": 
"model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00134-of-00171.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.84.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": 
"model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00135-of-00171.safetensors", + 
"model.layers.48.mlp.experts.98.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00135-of-00171.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.gate.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00136-of-00171.safetensors", + "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.q_a_layernorm.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.q_a_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.48.self_attn.q_b_proj.weight": "model-00133-of-00171.safetensors", + "model.layers.49.input_layernorm.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00136-of-00171.safetensors", 
+ "model.layers.49.mlp.experts.1.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.105.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.111.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.119.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.125.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.131.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.139.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00139-of-00171.safetensors", + 
"model.layers.49.mlp.experts.145.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00139-of-00171.safetensors", + 
"model.layers.49.mlp.experts.151.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00139-of-00171.safetensors", + 
"model.layers.49.mlp.experts.159.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": 
"model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00136-of-00171.safetensors", + 
"model.layers.49.mlp.experts.29.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": 
"model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00137-of-00171.safetensors", + 
"model.layers.49.mlp.experts.42.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": 
"model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00137-of-00171.safetensors", + 
"model.layers.49.mlp.experts.56.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": 
"model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00137-of-00171.safetensors", + 
"model.layers.49.mlp.experts.7.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": 
"model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00137-of-00171.safetensors", + 
"model.layers.49.mlp.experts.83.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00137-of-00171.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": 
"model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00138-of-00171.safetensors", + 
"model.layers.49.mlp.experts.97.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00138-of-00171.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.gate.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00139-of-00171.safetensors", + "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.q_a_layernorm.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.q_a_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.49.self_attn.q_b_proj.weight": "model-00136-of-00171.safetensors", + "model.layers.5.input_layernorm.weight": 
"model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00009-of-00171.safetensors", + 
"model.layers.5.mlp.experts.104.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": 
"model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00010-of-00171.safetensors", + 
"model.layers.5.mlp.experts.118.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": 
"model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00010-of-00171.safetensors", + 
"model.layers.5.mlp.experts.131.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": 
"model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00010-of-00171.safetensors", + 
"model.layers.5.mlp.experts.145.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": 
"model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00010-of-00171.safetensors", + 
"model.layers.5.mlp.experts.159.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": 
"model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00008-of-00171.safetensors", + 
"model.layers.5.mlp.experts.29.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": 
"model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00008-of-00171.safetensors", + 
"model.layers.5.mlp.experts.42.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": 
"model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00009-of-00171.safetensors", + 
"model.layers.5.mlp.experts.56.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": 
"model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00008-of-00171.safetensors", + 
"model.layers.5.mlp.experts.7.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": 
"model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00009-of-00171.safetensors", + 
"model.layers.5.mlp.experts.83.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": 
"model-00008-of-00171.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00009-of-00171.safetensors", + 
"model.layers.5.mlp.experts.97.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00009-of-00171.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.gate.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00010-of-00171.safetensors", + "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00007-of-00171.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00007-of-00171.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00008-of-00171.safetensors", + "model.layers.5.self_attn.q_a_layernorm.weight": "model-00007-of-00171.safetensors", + "model.layers.5.self_attn.q_a_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.5.self_attn.q_b_proj.weight": "model-00007-of-00171.safetensors", + "model.layers.50.input_layernorm.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00139-of-00171.safetensors", + 
"model.layers.50.mlp.experts.0.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.104.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.111.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.118.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.124.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.131.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.138.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.144.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.50.mlp.experts.151.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.50.mlp.experts.158.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": 
"model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00139-of-00171.safetensors", + 
"model.layers.50.mlp.experts.28.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": 
"model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00140-of-00171.safetensors", + 
"model.layers.50.mlp.experts.41.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": 
"model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00140-of-00171.safetensors", + 
"model.layers.50.mlp.experts.55.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": 
"model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00140-of-00171.safetensors", + 
"model.layers.50.mlp.experts.69.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": 
"model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00140-of-00171.safetensors", + 
"model.layers.50.mlp.experts.82.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": 
"model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00140-of-00171.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00141-of-00171.safetensors", + 
"model.layers.50.mlp.experts.96.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00141-of-00171.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.gate.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00142-of-00171.safetensors", + "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00139-of-00171.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-00171.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.50.self_attn.q_a_layernorm.weight": "model-00139-of-00171.safetensors", + "model.layers.50.self_attn.q_a_proj.weight": 
"model-00139-of-00171.safetensors", + "model.layers.50.self_attn.q_b_proj.weight": "model-00139-of-00171.safetensors", + "model.layers.51.input_layernorm.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00144-of-00171.safetensors", + 
"model.layers.51.mlp.experts.103.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.51.mlp.experts.110.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00144-of-00171.safetensors", + 
"model.layers.51.mlp.experts.117.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00144-of-00171.safetensors", + 
"model.layers.51.mlp.experts.123.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.51.mlp.experts.130.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00144-of-00171.safetensors", + 
"model.layers.51.mlp.experts.137.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00144-of-00171.safetensors", + 
"model.layers.51.mlp.experts.143.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.51.mlp.experts.150.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00145-of-00171.safetensors", + 
"model.layers.51.mlp.experts.157.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": 
"model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00142-of-00171.safetensors", + 
"model.layers.51.mlp.experts.27.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": 
"model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00143-of-00171.safetensors", + 
"model.layers.51.mlp.experts.40.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": 
"model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00143-of-00171.safetensors", + 
"model.layers.51.mlp.experts.54.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": 
"model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00143-of-00171.safetensors", + 
"model.layers.51.mlp.experts.68.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": 
"model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00143-of-00171.safetensors", + 
"model.layers.51.mlp.experts.81.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": 
"model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00143-of-00171.safetensors", + 
"model.layers.51.mlp.experts.95.gate_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00143-of-00171.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00144-of-00171.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.gate.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00145-of-00171.safetensors", + "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00142-of-00171.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-00171.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight": 
"model-00142-of-00171.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.self_attn.q_a_layernorm.weight": "model-00142-of-00171.safetensors", + "model.layers.51.self_attn.q_a_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.51.self_attn.q_b_proj.weight": "model-00142-of-00171.safetensors", + "model.layers.52.input_layernorm.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.102.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.11.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.116.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.122.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.13.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.136.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.142.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.15.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00147-of-00171.safetensors", + 
"model.layers.52.mlp.experts.156.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00147-of-00171.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00145-of-00171.safetensors", + 
"model.layers.52.mlp.experts.19.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": 
"model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00145-of-00171.safetensors", + 
"model.layers.52.mlp.experts.32.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": 
"model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00146-of-00171.safetensors", + 
"model.layers.52.mlp.experts.46.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": 
"model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00145-of-00171.safetensors", + 
"model.layers.52.mlp.experts.6.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": 
"model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00146-of-00171.safetensors", + 
"model.layers.52.mlp.experts.73.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": 
"model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00146-of-00171.safetensors", + 
"model.layers.52.mlp.experts.87.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": 
"model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00146-of-00171.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.gate.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00148-of-00171.safetensors", + 
"model.layers.52.post_attention_layernorm.weight": "model-00148-of-00171.safetensors", + "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.q_a_layernorm.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.q_a_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.52.self_attn.q_b_proj.weight": "model-00145-of-00171.safetensors", + "model.layers.53.input_layernorm.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": 
"model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00150-of-00171.safetensors", 
+ "model.layers.53.mlp.experts.109.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.115.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.121.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.129.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.135.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.141.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.149.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.experts.155.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00148-of-00171.safetensors", + 
"model.layers.53.mlp.experts.18.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": 
"model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00148-of-00171.safetensors", + 
"model.layers.53.mlp.experts.31.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": 
"model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00148-of-00171.safetensors", + 
"model.layers.53.mlp.experts.45.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": 
"model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00149-of-00171.safetensors", + 
"model.layers.53.mlp.experts.59.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": 
"model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00149-of-00171.safetensors", + 
"model.layers.53.mlp.experts.72.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": 
"model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00149-of-00171.safetensors", + 
"model.layers.53.mlp.experts.86.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": 
"model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00149-of-00171.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.gate.weight": "model-00150-of-00171.safetensors", + 
"model.layers.53.mlp.shared_experts.down_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00150-of-00171.safetensors", + "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.q_a_layernorm.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.q_a_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.53.self_attn.q_b_proj.weight": "model-00148-of-00171.safetensors", + "model.layers.54.input_layernorm.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": 
"model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00152-of-00171.safetensors", 
+ "model.layers.54.mlp.experts.108.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.114.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.120.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.128.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.134.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.140.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.148.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00153-of-00171.safetensors", + 
"model.layers.54.mlp.experts.154.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00151-of-00171.safetensors", + 
"model.layers.54.mlp.experts.17.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": 
"model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00151-of-00171.safetensors", + 
"model.layers.54.mlp.experts.30.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": 
"model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00151-of-00171.safetensors", + 
"model.layers.54.mlp.experts.44.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": 
"model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00152-of-00171.safetensors", + 
"model.layers.54.mlp.experts.58.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": 
"model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00152-of-00171.safetensors", + 
"model.layers.54.mlp.experts.71.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": 
"model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00152-of-00171.safetensors", + 
"model.layers.54.mlp.experts.85.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": 
"model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00152-of-00171.safetensors", + 
"model.layers.54.mlp.experts.99.up_proj.weight": "model-00152-of-00171.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.gate.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00153-of-00171.safetensors", + "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00151-of-00171.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00151-of-00171.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.54.self_attn.q_a_layernorm.weight": "model-00150-of-00171.safetensors", + "model.layers.54.self_attn.q_a_proj.weight": "model-00150-of-00171.safetensors", + "model.layers.54.self_attn.q_b_proj.weight": "model-00151-of-00171.safetensors", + "model.layers.55.input_layernorm.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.10.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00155-of-00171.safetensors", + 
"model.layers.55.mlp.experts.107.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00155-of-00171.safetensors", + 
"model.layers.55.mlp.experts.113.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.12.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00156-of-00171.safetensors", + 
"model.layers.55.mlp.experts.127.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00156-of-00171.safetensors", + 
"model.layers.55.mlp.experts.133.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.14.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00156-of-00171.safetensors", + 
"model.layers.55.mlp.experts.147.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00156-of-00171.safetensors", + 
"model.layers.55.mlp.experts.153.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.16.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": 
"model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.3.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": 
"model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.43.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": 
"model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00154-of-00171.safetensors", + 
"model.layers.55.mlp.experts.57.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": 
"model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00155-of-00171.safetensors", + 
"model.layers.55.mlp.experts.70.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": 
"model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00155-of-00171.safetensors", + 
"model.layers.55.mlp.experts.84.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00154-of-00171.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": 
"model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00155-of-00171.safetensors", + 
"model.layers.55.mlp.experts.98.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00155-of-00171.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.gate.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00156-of-00171.safetensors", + "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.q_a_layernorm.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.q_a_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.55.self_attn.q_b_proj.weight": "model-00153-of-00171.safetensors", + "model.layers.56.input_layernorm.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00156-of-00171.safetensors", + 
"model.layers.56.mlp.experts.1.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00158-of-00171.safetensors", + 
"model.layers.56.mlp.experts.106.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00158-of-00171.safetensors", + 
"model.layers.56.mlp.experts.112.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.119.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.126.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.132.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.139.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.146.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.152.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00159-of-00171.safetensors", + 
"model.layers.56.mlp.experts.159.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": 
"model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00157-of-00171.safetensors", + 
"model.layers.56.mlp.experts.29.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": 
"model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00157-of-00171.safetensors", + 
"model.layers.56.mlp.experts.42.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": 
"model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00157-of-00171.safetensors", + 
"model.layers.56.mlp.experts.56.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": 
"model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00157-of-00171.safetensors", + 
"model.layers.56.mlp.experts.7.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": 
"model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00158-of-00171.safetensors", + 
"model.layers.56.mlp.experts.83.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00157-of-00171.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": 
"model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00158-of-00171.safetensors", + 
"model.layers.56.mlp.experts.97.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00158-of-00171.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.gate.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00159-of-00171.safetensors", + "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.q_a_layernorm.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.q_a_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.56.self_attn.q_b_proj.weight": "model-00156-of-00171.safetensors", + "model.layers.57.input_layernorm.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": 
"model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.105.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.111.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.118.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.125.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.131.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.138.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.145.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.151.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00162-of-00171.safetensors", + 
"model.layers.57.mlp.experts.158.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": 
"model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00160-of-00171.safetensors", + 
"model.layers.57.mlp.experts.28.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": 
"model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00160-of-00171.safetensors", + 
"model.layers.57.mlp.experts.41.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": 
"model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00160-of-00171.safetensors", + 
"model.layers.57.mlp.experts.55.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": 
"model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00160-of-00171.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.69.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": 
"model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.82.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": 
"model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00161-of-00171.safetensors", + 
"model.layers.57.mlp.experts.96.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00161-of-00171.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.gate.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00162-of-00171.safetensors", + "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.q_a_layernorm.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.q_a_proj.weight": "model-00159-of-00171.safetensors", + "model.layers.57.self_attn.q_b_proj.weight": 
"model-00159-of-00171.safetensors", + "model.layers.58.input_layernorm.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.104.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.110.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.117.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.124.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.58.mlp.experts.130.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.58.mlp.experts.137.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.58.mlp.experts.144.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.58.mlp.experts.150.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.58.mlp.experts.157.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": 
"model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00163-of-00171.safetensors", + 
"model.layers.58.mlp.experts.27.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": 
"model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00163-of-00171.safetensors", + 
"model.layers.58.mlp.experts.40.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": 
"model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00163-of-00171.safetensors", + 
"model.layers.58.mlp.experts.54.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": 
"model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00163-of-00171.safetensors", + 
"model.layers.58.mlp.experts.68.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00163-of-00171.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": 
"model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.81.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": 
"model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00164-of-00171.safetensors", + 
"model.layers.58.mlp.experts.95.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00164-of-00171.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.gate.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00165-of-00171.safetensors", + "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00162-of-00171.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00162-of-00171.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.self_attn.o_proj.weight": 
"model-00162-of-00171.safetensors", + "model.layers.58.self_attn.q_a_layernorm.weight": "model-00162-of-00171.safetensors", + "model.layers.58.self_attn.q_a_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.58.self_attn.q_b_proj.weight": "model-00162-of-00171.safetensors", + "model.layers.59.input_layernorm.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00167-of-00171.safetensors", + 
"model.layers.59.mlp.experts.103.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.59.mlp.experts.11.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00167-of-00171.safetensors", + 
"model.layers.59.mlp.experts.116.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00167-of-00171.safetensors", + 
"model.layers.59.mlp.experts.123.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.59.mlp.experts.13.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00168-of-00171.safetensors", + 
"model.layers.59.mlp.experts.136.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00168-of-00171.safetensors", + 
"model.layers.59.mlp.experts.143.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.59.mlp.experts.15.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00168-of-00171.safetensors", + 
"model.layers.59.mlp.experts.156.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00166-of-00171.safetensors", + 
"model.layers.59.mlp.experts.2.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": 
"model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00166-of-00171.safetensors", + 
"model.layers.59.mlp.experts.33.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": 
"model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00166-of-00171.safetensors", + 
"model.layers.59.mlp.experts.47.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": 
"model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00165-of-00171.safetensors", + 
"model.layers.59.mlp.experts.60.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": 
"model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00166-of-00171.safetensors", + 
"model.layers.59.mlp.experts.74.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00166-of-00171.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": 
"model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00167-of-00171.safetensors", + 
"model.layers.59.mlp.experts.88.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": 
"model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00167-of-00171.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.gate.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00168-of-00171.safetensors", + 
"model.layers.59.self_attn.kv_a_layernorm.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.q_a_layernorm.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.q_a_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.59.self_attn.q_b_proj.weight": "model-00165-of-00171.safetensors", + "model.layers.6.input_layernorm.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00012-of-00171.safetensors", + 
"model.layers.6.mlp.experts.102.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": 
"model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00013-of-00171.safetensors", + 
"model.layers.6.mlp.experts.116.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": 
"model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00013-of-00171.safetensors", + 
"model.layers.6.mlp.experts.13.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": 
"model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00013-of-00171.safetensors", + 
"model.layers.6.mlp.experts.143.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": 
"model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00013-of-00171.safetensors", + 
"model.layers.6.mlp.experts.157.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": 
"model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00011-of-00171.safetensors", + 
"model.layers.6.mlp.experts.27.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": 
"model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00011-of-00171.safetensors", + 
"model.layers.6.mlp.experts.40.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": 
"model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00011-of-00171.safetensors", + 
"model.layers.6.mlp.experts.54.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": 
"model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00012-of-00171.safetensors", + 
"model.layers.6.mlp.experts.68.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": 
"model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00012-of-00171.safetensors", + 
"model.layers.6.mlp.experts.81.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": 
"model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00011-of-00171.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00012-of-00171.safetensors", + 
"model.layers.6.mlp.experts.95.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00012-of-00171.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.gate.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00013-of-00171.safetensors", + "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00010-of-00171.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": 
"model-00010-of-00171.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.self_attn.q_a_layernorm.weight": "model-00010-of-00171.safetensors", + "model.layers.6.self_attn.q_a_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.6.self_attn.q_b_proj.weight": "model-00010-of-00171.safetensors", + "model.layers.60.input_layernorm.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": 
"model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00170-of-00171.safetensors", 
+ "model.layers.60.mlp.experts.11.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00170-of-00171.safetensors", + 
"model.layers.60.mlp.experts.116.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00170-of-00171.safetensors", + 
"model.layers.60.mlp.experts.122.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00170-of-00171.safetensors", + 
"model.layers.60.mlp.experts.13.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00170-of-00171.safetensors", + 
"model.layers.60.mlp.experts.136.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00171-of-00171.safetensors", + 
"model.layers.60.mlp.experts.142.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00171-of-00171.safetensors", + 
"model.layers.60.mlp.experts.15.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00171-of-00171.safetensors", + 
"model.layers.60.mlp.experts.156.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00168-of-00171.safetensors", + 
"model.layers.60.mlp.experts.19.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": 
"model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00169-of-00171.safetensors", + 
"model.layers.60.mlp.experts.32.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": 
"model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00169-of-00171.safetensors", + 
"model.layers.60.mlp.experts.46.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": 
"model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00168-of-00171.safetensors", + 
"model.layers.60.mlp.experts.6.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": 
"model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00169-of-00171.safetensors", + 
"model.layers.60.mlp.experts.73.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": 
"model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00169-of-00171.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00170-of-00171.safetensors", + 
"model.layers.60.mlp.experts.87.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": 
"model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00170-of-00171.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.gate.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00171-of-00171.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00171-of-00171.safetensors", + 
"model.layers.60.post_attention_layernorm.weight": "model-00171-of-00171.safetensors", + "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.q_a_layernorm.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.q_a_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.60.self_attn.q_b_proj.weight": "model-00168-of-00171.safetensors", + "model.layers.7.input_layernorm.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00015-of-00171.safetensors", + 
"model.layers.7.mlp.experts.101.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": 
"model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00015-of-00171.safetensors", + 
"model.layers.7.mlp.experts.115.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": 
"model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00016-of-00171.safetensors", + 
"model.layers.7.mlp.experts.129.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": 
"model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00016-of-00171.safetensors", + 
"model.layers.7.mlp.experts.142.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": 
"model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00016-of-00171.safetensors", + 
"model.layers.7.mlp.experts.156.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": 
"model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00014-of-00171.safetensors", + 
"model.layers.7.mlp.experts.26.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": 
"model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-00171.safetensors", + 
"model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": 
"model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00014-of-00171.safetensors", + 
"model.layers.7.mlp.experts.53.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": 
"model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00015-of-00171.safetensors", + 
"model.layers.7.mlp.experts.67.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": 
"model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00015-of-00171.safetensors", + 
"model.layers.7.mlp.experts.80.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": 
"model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00014-of-00171.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00015-of-00171.safetensors", + 
"model.layers.7.mlp.experts.94.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00015-of-00171.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.gate.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00016-of-00171.safetensors", + "model.layers.7.self_attn.kv_a_layernorm.weight": 
"model-00013-of-00171.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-00171.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-00171.safetensors", + "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-00171.safetensors", + "model.layers.8.input_layernorm.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": 
"model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00018-of-00171.safetensors", + 
"model.layers.8.mlp.experts.109.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": 
"model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00018-of-00171.safetensors", + 
"model.layers.8.mlp.experts.122.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": 
"model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00019-of-00171.safetensors", + 
"model.layers.8.mlp.experts.136.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": 
"model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00017-of-00171.safetensors", + 
"model.layers.8.mlp.experts.15.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": 
"model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00016-of-00171.safetensors", + 
"model.layers.8.mlp.experts.2.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": 
"model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00017-of-00171.safetensors", + 
"model.layers.8.mlp.experts.33.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": 
"model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00017-of-00171.safetensors", + 
"model.layers.8.mlp.experts.47.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": 
"model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00017-of-00171.safetensors", + 
"model.layers.8.mlp.experts.60.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00017-of-00171.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": 
"model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00018-of-00171.safetensors", + 
"model.layers.8.mlp.experts.74.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": 
"model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00018-of-00171.safetensors", + 
"model.layers.8.mlp.experts.88.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": 
"model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00018-of-00171.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.gate.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00019-of-00171.safetensors", + "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00016-of-00171.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00016-of-00171.safetensors", + 
"model.layers.8.self_attn.kv_b_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.self_attn.q_a_layernorm.weight": "model-00016-of-00171.safetensors", + "model.layers.8.self_attn.q_a_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.8.self_attn.q_b_proj.weight": "model-00016-of-00171.safetensors", + "model.layers.9.input_layernorm.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00021-of-00171.safetensors", + 
"model.layers.9.mlp.experts.102.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": 
"model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00021-of-00171.safetensors", + 
"model.layers.9.mlp.experts.116.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": 
"model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00019-of-00171.safetensors", + 
"model.layers.9.mlp.experts.13.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": 
"model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00022-of-00171.safetensors", + 
"model.layers.9.mlp.experts.143.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": 
"model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00022-of-00171.safetensors", + 
"model.layers.9.mlp.experts.157.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": 
"model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00020-of-00171.safetensors", + 
"model.layers.9.mlp.experts.27.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": 
"model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00020-of-00171.safetensors", + 
"model.layers.9.mlp.experts.40.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": 
"model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00020-of-00171.safetensors", + 
"model.layers.9.mlp.experts.54.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": 
"model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00020-of-00171.safetensors", + 
"model.layers.9.mlp.experts.68.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00020-of-00171.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": 
"model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00021-of-00171.safetensors", + 
"model.layers.9.mlp.experts.81.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": 
"model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00021-of-00171.safetensors", + 
"model.layers.9.mlp.experts.95.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00021-of-00171.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.gate.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00022-of-00171.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00022-of-00171.safetensors", + "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00019-of-00171.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00019-of-00171.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00019-of-00171.safetensors", + 
"model.layers.9.self_attn.q_a_layernorm.weight": "model-00019-of-00171.safetensors", + "model.layers.9.self_attn.q_a_proj.weight": "model-00019-of-00171.safetensors", + "model.layers.9.self_attn.q_b_proj.weight": "model-00019-of-00171.safetensors", + "model.norm.weight": "model-00171-of-00171.safetensors" + } +}