zerofata

79 models

MS3.2-PaintedFantasy-v4.1-24B-GGUF

license:mit
1,020 downloads · 0 likes


Q3.5-BlueStar-v2-27B-GGUF

license:mit
642 downloads · 0 likes

MS3.2-PaintedFantasy-v2-24B

This is an uncensored creative model intended to excel at character-driven RP / ERP. Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), but pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO
- SFT with RP/ERP, stories and in-character assistant data.
- DPO focused on reducing repetition, misgendered characters and slop.
- KTO focused on further reducing repetition and slop.

Not optimized for cost / performance efficiency, YMMV.
SFT (1xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: yourentity
wandb_name: runname
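A hedged sketch of what one training record in this messages format could look like: the SFT config above maps a `messages` list with user/assistant/system roles, one JSON object per line in the dataset file. The actual dataset is not public; this record is purely illustrative.

```python
import json

# Illustrative record in the messages format the SFT dataset config expects.
# Names and dialogue here are made up, not taken from the real dataset.
record = {
    "messages": [
        {"role": "system", "content": "Roleplay as Kael, a weary caravan guard."},
        {"role": "user", "content": "The gates are closing. Do we run for it?"},
        {"role": "assistant", "content": "Kael shakes his head. \"We walk. Running gets you shot.\""},
    ]
}

# dataset.jsonl holds one such JSON object per line
line = json.dumps(record, ensure_ascii=False)
print(json.loads(line)["messages"][-1]["role"])  # assistant
```

With train_on_inputs: false, only the assistant turns contribute to the loss; the system and user turns are masked out.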

license:apache-2.0
265 downloads · 34 likes

L3.3 GeneticLemonade Final 70B

Inspired to learn how to merge by the Nevoria series from SteelSkull. This model is the second result of the Genetic Lemonade series.

Designed for RP and creative writing, all three models are focused around striking a balance between writing style, creativity and intelligence. The basic differences between the models are below.

| Version | Strength | Weakness |
|---------|----------|----------|
| Unleashed | Well balanced | Somewhat censored |
| Final | Fully uncensored | Least intelligent |
| Sunset | Well balanced, most intelligent | GPTisms / weakest writing style |

Llam@ception is recommended for sane defaults if unsure; import the presets into SillyTavern and they're plug-n-play.

Sampler Settings
- Temp: 0.9-1.0
- MinP: 0.03-0.05
- Dry: 0.8, 1.75, 4

Temperature last, neutralize other samplers. This model natively strikes a balance of creativity & intelligence.

Use Llama-3-Instruct-Names, but you will need to uncheck "System same as user".

- Static quants by mradermacher
- iMatrix quants by mradermacher

The base aims to build a strong general-purpose model using high-performing models that are trained on various datasets from different languages / cultures. This is to reduce the chance of the same datasets appearing multiple times and to build natural creativity into L3.3. The second merge aims to impart specific RP / creative writing knowledge, again focusing on finding high-performing models that use (or likely use) different datasets.
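The sampler settings above can be expressed as a request payload for an OpenAI-compatible chat endpoint. This is a hedged sketch: the `min_p` and `dry_*` parameter names follow llama.cpp-server-style extensions and are assumptions about your backend, and the model id and messages are illustrative.

```python
# Hedged sketch: card-recommended samplers as an OpenAI-compatible payload.
# Check which extended sampler names (min_p, dry_*) your backend accepts.
payload = {
    "model": "L3.3-GeneticLemonade-Final-70B",  # hypothetical model id
    "messages": [
        {"role": "system", "content": "You are the narrator of a fantasy RP."},
        {"role": "user", "content": "Describe the harbor at dusk."},
    ],
    "temperature": 0.95,     # card recommends 0.9-1.0, applied last
    "min_p": 0.04,           # card recommends 0.03-0.05
    "dry_multiplier": 0.8,   # card's "Dry: 0.8, 1.75, 4"
    "dry_base": 1.75,
    "dry_allowed_length": 4,
}
# e.g. requests.post("http://localhost:8080/v1/chat/completions", json=payload)
```

"Temperature last" means the backend should apply temperature after the truncation samplers, which is why the other samplers are left neutralized.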

llama
180 downloads · 11 likes

GLM-4.5-Iceblink-v3-106B-A12B-GGUF

license:mit
155 downloads · 3 likes

MS3.2 PaintedFantasy Visage V3 34B

No layer left behind edition. Upscale redone with the missing final layer included.
The original upscales were always missing a layer, but I never troubleshot which layer it was. Turns out it was the final layer. That's kind of an important one.

This model is an uncensored creative writing and RP model. Compared to the older version, it is smarter and I think has a bit less repetition, though the old V2 version is slightly more creative due to the instability it had.

Creation Process: Upscale > CPT > SFT > DPO
- Pretrained on approx 300MB of light novel and FineWeb-2 corpus.
- SFT on approx 8 million tokens: SFW / NSFW RP, stories and creative instruct data.
- DPO on a high quality RP / NSFW dataset with a focus on improving instruction following, reducing repetition and fixing common model mistakes.

Merge configurations used during the model creation process.

Upscale (Passthrough)

base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [0, 29]
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [10, 40]

Not optimized for cost / performance efficiency, YMMV.
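The layer arithmetic behind the passthrough upscale can be sketched as follows, assuming mergekit's half-open layer_range convention ([start, end) yields end - start layers per slice); the [10, 40] slice implies the 24B base has 40 layers.

```python
# Hedged sketch: layer count of the passthrough upscale, assuming half-open
# layer_range semantics (end - start layers per slice).
slices = [(0, 29), (10, 40)]  # layer_range values from the merge config
layers = sum(end - start for start, end in slices)
print(layers)  # 29 + 30 = 59 layers in the upscale, versus 40 in the base
```

Layers 10-28 of the base are duplicated by the overlap, which is how a 24B model grows to roughly 34B parameters.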
Pretrain (4xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv3upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-PT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1

SFT (4xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-SFT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2

DPO (2xH200)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.085

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
  - path: ./data/approvedautomatedl3dataset.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# LORA CONFIGURATION
# ====================
adapter: lora
load_in_8bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 2e-6
optimizer: adamw_torch_fused
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this
deepspeed: deepspeed_configs/zero1.json

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2-DPO-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-DPO
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2-DPO-2

128 downloads · 26 likes

MS3.2-PaintedFantasy-v4-24B

license:mit
101 downloads · 17 likes

MS3.2 PaintedFantasy Visage V4 34B


license:mit
88 downloads · 9 likes

GLM 4.5 Iceblink 106B A12B

An experimental GLM 4.5 Air finetune. I had this one in the works for a while, but was struggling to find the right hyperparameters to get this model to behave nicely. Thank you to TheDrummer for helping me out with them.

This model is a creative writing and RP model. It's pretty verbose.
The intent is to keep the behavior of the original model, but to slightly improve writing, dialogue & creativity.

Creation Process: SFT

SFT on approx 10 million tokens, SFW / NSFW RP, stories, creative instruct & chat data.

MoE models are brutal to train even with a small dataset like mine, so I took a different approach from usual. I used a very low LR in an effort to avoid having to apply DPO / KTO training afterwards. I think there's likely a better config to be found, but experimentation with the model to find it is quite draining.

Not optimized for cost / performance efficiency, YMMV.

SFT (4xH200)

base_model: zai-org/GLM-4.5-Air

eot_tokens:
  - "<|user|>"
  - "<|endoftext|>"
special_tokens:
  eos_token: "<|user|>"

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path: ./last_run_prepared
train_on_inputs: false  # Only train on assistant responses
eval_sample_packing: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.1
lora_target_modules:
  - gate_proj
  - down_proj
  - up_proj
  - q_proj
  - v_proj
  - k_proj
  - o_proj
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 4.5e-6
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0
val_set_size: 0.02

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
liger_rope: false
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_fused_linear_cross_entropy: true
cut_cross_entropy: false

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
eval_steps: 35
save_total_limit: 18  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./GLM-AIR-SFTv2-5
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: GLM-AIR-SFT
# wandb_entity: your_entity
wandb_name: GLM-AIR-SFTv2-5
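As a rough sanity check on the config above, the batch geometry can be worked out from the listed values. This assumes pure data parallelism across the 4 H200s; tokens per step is an upper bound, since sample packing rarely fills every sequence exactly:

```python
# Hypothetical back-of-envelope math for the SFT config above; the 4-GPU
# data-parallel assumption and the ~10M-token dataset size come from the text.
micro_batch_size = 2
gradient_accumulation_steps = 4
num_gpus = 4  # assumption: one data-parallel rank per H200

effective_batch = micro_batch_size * gradient_accumulation_steps * num_gpus
print(effective_batch)  # 32 sequences per optimizer step

sequence_len = 8192
tokens_per_step = effective_batch * sequence_len
print(tokens_per_step)  # 262144 tokens per step (upper bound with packing)

dataset_tokens = 10_000_000
num_epochs = 3
steps_per_epoch = dataset_tokens // tokens_per_step
print(steps_per_epoch * num_epochs)  # ~114 optimizer steps across all epochs
```

At only ~114 optimizer steps, the `warmup_ratio: 0.05` amounts to a handful of warmup steps, which is consistent with the very conservative 4.5e-6 learning rate described above.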

license:mit
74
13

L3.3-GeneticLemonade-Opus-70B

Felt like making a merge. This model combines three individually solid, stable and distinctly different RP models:

zerofata/GeneticLemonade-Unleashed-v3 - Creative, generalist RP / ERP model.
Delta-Vector/Plesio-70B - Unique prose and unique dialogue RP / ERP model.
TheDrummer/Anubis-70B-v1.1 - Character portrayal, neutrally aligned RP / ERP model.

Play with these; they are not the 'best' settings, just a stable baseline.

Recommended Samplers

Llama-3-Instruct-Names, but you will need to uncheck "System same as user".

models:
  - model: zerofata/L3.3-GeneticLemonade-Unleashed-v3-70B
  - model: Delta-Vector/Plesio-70B
  - model: TheDrummer/Anubis-70B-v1.1
base_model: shisa-ai/shisa-v2-llama3.3-70b
merge_method: sce
parameters:
  select_topk: 0.16
out_dtype: bfloat16
tokenizer:
  source: base
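The `select_topk: 0.16` parameter controls how aggressively the SCE method filters the donor models' weight deltas. The sketch below illustrates the idea in pure Python; it is NOT mergekit's actual implementation, just the intuition of keeping the highest-variance fraction of deltas:

```python
import random
import statistics

# Loose illustration of select_topk in SCE-style merging: keep only the
# fraction of weights where the donor models disagree most, and fuse those.
# All names and the toy data here are illustrative, not mergekit internals.
random.seed(0)
n = 1000
base = [random.gauss(0, 1) for _ in range(n)]
donors = [[b + random.gauss(0, s) for b in base] for s in (0.1, 0.2, 0.3)]

deltas = [[m[i] - base[i] for m in donors] for i in range(n)]  # task vectors per weight
variance = [statistics.pvariance(d) for d in deltas]           # disagreement per weight

k = int(0.16 * n)                                              # select_topk: 0.16
keep = sorted(range(n), key=lambda i: variance[i])[-k:]        # top 16% positions

merged = list(base)
for i in keep:                                                 # fuse only selected weights
    merged[i] += sum(deltas[i]) / len(deltas[i])

print(k)  # 160 of 1000 weights eligible for merging
```

A low `select_topk` like 0.16 keeps the merge close to the base model and only pulls in the spots where the three RP models differ most.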

llama
66
12

MS3.2-PaintedFantasy-v3-24B

license:apache-2.0
49
8

L3.3-GeneticLemonade-Final-v2-70B

Wasn't intending to release another model (so soon at least), but I was testing out some new dataset ideas and thought this model came out pretty nice.

zerofata/GeneticLemonade-Final SFT QLora finetune.

This is an uncensored creative model intended to excel at character driven RP / ERP. This model is designed to provide longer, narrative heavy responses where characters are portrayed accurately and proactively.

Compared to Unleashed v3, this model has significantly reduced positivity bias and arguably a nicer writing style. The tradeoff is that it's swipe-heavy, makes a few more logical errors and can be a bit too concise at times.

Play with these; they are not the 'best' settings, just a stable baseline.

Recommended Samplers

Llama-3-Instruct-Names, but you will need to uncheck "System same as user".

This model was trained using a dataset of approx 4.3 million tokens: 700 RP conversations, 2000 creative writing / instruct samples and about 400 summaries. The bulk of this data has been made public. This model didn't take well to my existing DPO dataset, so it hasn't been used here.
Axolotl configs

Not optimized for cost / performance efficiency, YMMV.

SFT (1xH200)

llama
47
9

L3.3-GeneticLemonade-Unleashed-v3-70B

An experimental release. zerofata/GeneticLemonade-Unleashed SFT+DPO QLora finetune.

This is a creative model intended to excel at character driven RP / ERP. It has not been tested or trained on adventure stories or any large amounts of creative writing. This model is designed to provide longer, narrative heavy responses where characters are portrayed accurately and proactively.

Play with these; they are not the 'best' settings, just a stable baseline. Something interesting to note is this model supports higher temps than would normally be recommended for other L3 models.

Recommended Samplers

Llama-3-Instruct-Names, but you will need to uncheck "System same as user".

The model first went through SFT with a small synthetic dataset of 2.9 million tokens, approximately 750 conversations. Primarily RP data with small amounts of random instruct / assistant data and creative writing.
The model then went through DPO training using approx 1100 chosen examples from the SFT dataset that were of exceptional quality or showed verifiable instruction following. Rejected samples were generated using another Llama 3.3 finetune that is known for poor instruction following.

Axolotl configs

Neither is optimized for cost / performance efficiency, YMMV.

SFT (1xH200)
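Preference data for a DPO run like the one described above is typically a JSONL file of prompt / chosen / rejected triples. The record below is a hypothetical sketch of that shape — the field names are illustrative, not the exact dataset schema used here:

```python
import json

# Hypothetical shape of one preference pair matching the process described
# above: "chosen" drawn from the strongest SFT samples, "rejected" generated
# by a weaker Llama 3.3 finetune. Field names are illustrative only.
pair = {
    "prompt": [{"role": "user", "content": "Stay in character as the ship's captain."}],
    "chosen": [{"role": "assistant", "content": "The captain narrows her eyes at the horizon..."}],
    "rejected": [{"role": "assistant", "content": "Sure! Here are some tips for roleplaying a captain:"}],
}
line = json.dumps(pair)  # one line of the DPO JSONL
roundtrip = json.loads(line)
print(roundtrip["chosen"][0]["role"])  # assistant
```

With ~1100 such pairs, the chosen side rewards in-character, instruction-following replies while the rejected side penalizes the weaker model's failure modes.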

llama
39
22

MS3.2-PaintedFantasy-24B

Experimental release.

This is an uncensored creative model intended to excel at character driven RP / ERP. This model is designed to provide longer, narrative heavy responses where characters are portrayed accurately and proactively.

Training process: Pretrain > SFT > DPO > DPO 2

Did a small pretrain on some light novels and Frieren wiki data as a test. It hasn't seemed to hurt the model, and the model has shown some small improvements in the lore of series that were included.

The model then went through the standard SFT using a dataset of approx 3.6 million tokens: 700 RP conversations, 1000 creative writing / instruct samples and about 100 summaries. The bulk of this data has been made public.

Finally, DPO was used to make the model a little more consistent. The first stage of DPO focused on instruction following and the second tried to burn out some Mistral-isms.

Not optimized for cost / performance efficiency, YMMV.
SFT (1xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./MS3-2-Pretrain/merged
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 2
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 5
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./MS3-2-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: MS3-2-SFT
wandb_entity: your_entity
wandb_name: run_name
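The same back-of-envelope batch math applies to this config. On a single H100 there is no data parallelism, so the effective batch is just micro batch times accumulation; token counts are upper bounds under packing, and the ~3.6M-token dataset figure comes from the description above:

```python
# Hypothetical batch geometry for the MS3.2 SFT config above.
micro_batch_size = 4
gradient_accumulation_steps = 2
effective_batch = micro_batch_size * gradient_accumulation_steps  # single GPU
print(effective_batch)  # 8 sequences per optimizer step

sequence_len = 8192
tokens_per_step = effective_batch * sequence_len
print(tokens_per_step)  # 65536 tokens per step (upper bound with packing)

dataset_tokens = 3_600_000
num_epochs = 3
print(dataset_tokens // tokens_per_step * num_epochs)  # ~162 optimizer steps total
```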

license:apache-2.0
31
31

L3.3 GeneticLemonade Unleashed 70B

llama
27
11

GLM-4.5-Iceblink-v3-106B-A12B

license:mit
27
0

MS3.2-PaintedFantasy-v3-24B-exl3-6bpw

license:apache-2.0
26
0

GLM-4.5-Iceblink-v2-106B-A12B

Another re-attempt at GLM 4.5 Air. This time using a different training framework, some updated data and better hyperparameters.

This model is a creative writing and RP model. It's pretty verbose. The intent is to keep the behavior of the original model, but to improve writing, dialogue & creativity. Compared to the original Iceblink, the effect on this one is more pronounced, with hopefully minimal impact on the intelligence.

Creation Process: SFT

SFT on approx 13 million tokens, SFW / NSFW RP, stories, creative instruct & chat data. Some of the SFW datasets are public and can be found in the model datasets list.

I've switched over from Axolotl to MS-Swift w/ Megatron to train MoE models now. There's a roughly 5-10x speedup in training the models, thanks to escaping the naive MoE implementation in TRL. The training time for this run took only 40 minutes, excluding environment setup time.

A low LR for GLM Air appears to be king. Going any higher, I've found it extremely easy to begin overcooking the model.

Not optimized for cost / performance efficiency, YMMV.
SFT (8xH200)

PYTORCH_CUDA_ALLOC_CONF='expandable_segments:True' \
NPROC_PER_NODE=8 \
WANDB_API_KEY=wandb_key \
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
megatron sft \
  --load '/workspace/glm-4.5-air-mcore' \
  --dataset '/workspace/joined_dataset_cleaned_modified.jsonl' \
  --load_from_cache_file true \
  --train_type lora \
  --lora_rank 256 \
  --lora_alpha 16 \
  --use_rslora true \
  --target_modules all-linear \
  --split_dataset_ratio 0.01 \
  --moe_permute_fusion true \
  --tensor_model_parallel_size 8 \
  --expert_tensor_parallel_size 1 \
  --expert_model_parallel_size 8 \
  --moe_grouped_gemm true \
  --moe_shared_expert_overlap true \
  --moe_aux_loss_coeff 6e-5 \
  --micro_batch_size 4 \
  --global_batch_size 32 \
  --recompute_granularity full \
  --recompute_method uniform \
  --recompute_num_layers 1 \
  --max_epochs 2 \
  --cross_entropy_loss_fusion true \
  --lr 6e-6 \
  --lr_warmup_fraction 0.05 \
  --min_lr 6e-7 \
  --save megatron_output/Iceblink-v3-SFT-3 \
  --eval_interval 20 \
  --save_interval 25 \
  --finetune true \
  --packing true \
  --max_length 10280 \
  --num_workers 8 \
  --dataset_num_proc 8 \
  --no_save_optim true \
  --no_save_rng true \
  --sequence_parallel true \
  --wandb_project Megatron-Air-SFT \
  --wandb_exp_name Iceblink-v3-SFT-3 \
  --attention_backend flash

A shoutout to the people in BeaverAI discord that helped me test this model and my intermediate versions: ddh0 (Madison), Ambius, Dysfunctional & my dude.
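A few numbers fall straight out of the command's flags. Token counts are upper bounds since packing rarely fills every sequence, and the ~13M-token dataset size is the approximate figure given above:

```python
import math

# Back-of-envelope figures for the Megatron run above, from the flag values.
global_batch_size = 32
max_length = 10280
tokens_per_step = global_batch_size * max_length
print(tokens_per_step)  # 328960 tokens per optimizer step (upper bound)

dataset_tokens = 13_000_000  # approximate, per the description
max_epochs = 2
total_steps = dataset_tokens * max_epochs // tokens_per_step
print(total_steps)  # ~79 optimizer steps for the whole run

# With use_rslora, the adapter scale is lora_alpha / sqrt(lora_rank);
# the chosen rank-256 / alpha-16 pair lands exactly on a scale of 1.0.
print(16 / math.sqrt(256))  # 1.0
```

Very few total steps plus the 6e-6 peak LR is consistent with the note above that GLM Air overcooks easily at higher learning rates.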

license:mit
24
4

MS3.2-PaintedFantasy-Visage-v4-34b-exl3-6bpw

Magistral 24B Upscaled to 34B.
The latest Magistral model seems pretty good and has some refreshing prose. This is an uncensored creative writing and RP model. It uses a new (still work-in-progress) dataset I've been curating based on real character cards. It has some structural repetition; at this point that's a calling card of Mistral models. I think it's better than v3, though.

Creation Process: Upscale > CPT > SFT > Merge

After upscaling, the model was pretrained on approx. 100MB of light novels and a subset of DCLM records, then SFT on approx. 10 million tokens of SFW / NSFW RP, stories and creative instruct. I've removed some chat data that I think hurt more than helped and replaced it with conversations from real character cards.

I did some experimenting with LoRA methods, particularly DoRA vs rsLoRA. With DoRA the writing was fantastic, but the model wasn't able to handle its own creativity, even with further RLHF applied. rsLoRA took the data far better, but was significantly less adept at writing. I merged the two models together, using the stable version as the base, which seems to have successfully combined the positives of both models.
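The final merge is a SLERP between the two checkpoints with a per-layer-group interpolation schedule (`t: [0, 0, 0, 0.1, 0.2]`), i.e. early layers stay entirely on the stable base and only later layers drift toward the DoRA model. As a toy sketch of what SLERP does to a pair of weight vectors (a simplified stand-in for mergekit's implementation, not the actual code):

```python
import math

def slerp(a, b, t, eps=1e-8):
    """Spherical linear interpolation between two weight vectors (plain lists)."""
    norm_a = math.sqrt(sum(x * x for x in a)) + eps
    norm_b = math.sqrt(sum(x * x for x in b)) + eps
    dot = sum((x / norm_a) * (y / norm_b) for x, y in zip(a, b))
    theta = math.acos(max(-1.0, min(1.0, dot)))  # angle between the vectors
    if theta < eps:  # nearly colinear: fall back to plain lerp
        return [(1 - t) * x + t * y for x, y in zip(a, b)]
    s = math.sin(theta)
    wa = math.sin((1 - t) * theta) / s
    wb = math.sin(t * theta) / s
    return [wa * x + wb * y for x, y in zip(a, b)]

base = [0.2, -0.5, 0.1, 0.9]    # toy "stable" (rsLoRA) checkpoint weights
other = [0.4, 0.3, -0.2, 0.6]   # toy "creative" (DoRA) checkpoint weights

# t=0 keeps the base exactly; a small t nudges toward the other model.
print(slerp(base, other, 0.0))
print(slerp(base, other, 0.1))
```

Unlike a straight average, SLERP interpolates along the arc between the two weight directions, which is why small `t` values can blend in a little of the second model without washing out the base.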
Upscale

base_model: Darkhn/Magistral-Small-2509-Text-Only
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: Darkhn/Magistral-Small-2509-Text-Only
        layer_range: [0, 29]
  - sources:
      - model: Darkhn/Magistral-Small-2509-Text-Only
        layer_range: [10, 40]

Slerp Merge

models:
  - model: ApocalypseParty/Magi-PT-2-SFT-1-DPO-3
  - model: ApocalypseParty/Magi-PT-2-SFT-2
merge_method: slerp
base_model: ApocalypseParty/Magi-PT-2-SFT-2
parameters:
  t: [0, 0, 0, 0.1, 0.2]
dtype: bfloat16

Pretrain (2xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ApocalypseParty/magistral-34b
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/text_files_minimal_dataset.jsonl
    type: completion
  - path: ./data/filtered_results.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 64
lora_alpha: 64
lora_dropout: 0.0
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 3e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.0
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 16384
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Magi-PT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Magi-PT
# wandb_entity: your_entity
wandb_name: Magi-PT-2

SFT (2xH100)

base_model: ApocalypseParty/Magi-PT-2
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken
plugins:
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
load_in_8bit: true
load_in_4bit: false
deepspeed: deepspeed_configs/zero1.json
dataset_prepared_path: last_run_prepared
val_set_size: 0
output_dir: ./Magi-PT-2-SFT-2
lora_r: 128
lora_alpha: 128
lora_dropout: 0.05
lora_target_linear: true
lora_target_modules:
  - gate_proj
  - down_proj
  - up_proj
  - q_proj
  - v_proj
  - k_proj
  - o_proj
gradient_accumulation_steps: 4
micro_batch_size: 2
num_epochs: 3
optimizer: adamw_bnb_8bit
lr_scheduler: cosine
learning_rate: 1e-5
gradient_checkpointing: true
resume_from_checkpoint:
logging_steps: 1
flash_attention: true
warmup_ratio: 0.05
evals_per_epoch: 1
saves_per_epoch: 2
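For context on the adapter sizes in these configs (`lora_r: 64` for pretraining, `lora_r: 128` for SFT): each adapted linear layer of shape (d_in, d_out) adds r * (d_in + d_out) trainable weights. A rough illustration below; the layer shapes are invented for the example, not read from the actual 34B model:

```python
# Estimate LoRA trainable parameters: r * (d_in + d_out) per adapted linear layer.
def lora_params(layer_shapes, r):
    return sum(r * (d_in + d_out) for d_in, d_out in layer_shapes)

# Hypothetical shapes standing in for one transformer block's linear layers.
block = [
    (5120, 5120),   # q_proj
    (5120, 1024),   # k_proj
    (5120, 1024),   # v_proj
    (5120, 5120),   # o_proj
    (5120, 14336),  # gate_proj
    (5120, 14336),  # up_proj
    (14336, 5120),  # down_proj
]

per_block_r64 = lora_params(block, r=64)
per_block_r128 = lora_params(block, r=128)
print(per_block_r64, per_block_r128)
```

The count scales linearly with rank, so the r=128 SFT adapter is exactly twice the size of the r=64 pretraining adapter over the same target modules.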

license:mit
23
0

MS3.2-PaintedFantasy-v3-24B-exl3-4bpw

license:apache-2.0
21
1

MS3.2-PaintedFantasy-v3-24B-exl3-5bpw

license:apache-2.0
21
0

llama-3.3-70b-joyous-exl3-4.25bpw

llama
19
2

Q3.5-BlueStar-v2-27B

license:mit
19
0

L3.3-Cu-Mai-R1-70b-4.5bpw-hb6-exl2

llama
19
0

MS3.2-PaintedFantasy-Visage-33B_exl3_6bpw

license:apache-2.0
18
1

MS3.2-PaintedFantasy-v3-24B-exl3-3.5bpw

license:apache-2.0
15
0

Q3.5-BlueStar-27B

license:mit
13
0

MS3.2-PaintedFantasy-Visage-v4-34b-exl3-4bpw

@keyframes fallingleaf { 0% { transform: translateY(-20px) rotate(0deg); opacity: 1; } 100% { transform: translateY(100vh) rotate(360deg); opacity: 0.3; } } .container { --primary-accent: #7BC4C4; --secondary-accent: #9FD4D4; --accent-warm: #E8A5B5; --red-deep: #2C5F6F; --gold-bright: #B4DDD4; --ink-dark: #000000; --bg-main: #0A1A1A; --bg-container: #0F2525; --bg-card: rgba(15, 30, 35, 0.95); --text-main: #D5E8E8; --text-muted: #9CB9C4; --white: #FFFFFF; --border-color: #6B9BAA; --font-title: 'Inter', sans-serif; --font-body: 'Source Sans Pro', sans-serif; --font-code: 'JetBrains Mono', monospace; font-family: var(--font-body); color: var(--text-main); line-height: 1.7; font-weight: 400; max-width: 1100px; margin: 20px auto; padding: 50px 40px; background-color: var(--bg-main); background-image: radial-gradient(ellipse at top, rgba(20, 45, 60, 0.3), transparent 60%), radial-gradient(ellipse at bottom, rgba(0, 0, 0, 0.8), transparent 50%), linear-gradient(180deg, rgba(15, 30, 40, 0.6) 0%, rgba(12, 25, 35, 0.7) 25%, rgba(10, 20, 28, 0.8) 50%, rgba(8, 16, 22, 0.85) 75%, rgba(6, 12, 18, 0.9) 100%); min-height: calc(100vh - 40px); position: relative; z-index: 2; border-radius: 3px; box-shadow: 0 10px 60px rgba(0, 0, 0, 0.8), 0 2px 10px rgba(0, 0, 0, 0.9), inset 0 0 120px rgba(20, 40, 55, 0.1); border: 2px solid rgba(30, 60, 75, 0.4); } .container::before { content: ''; position: absolute; top: 0; left: 0; right: 0; bottom: 0; background-image: radial-gradient(circle 3px at 15% 12%, rgba(123, 196, 196, 0.4) 0%, transparent 100%), radial-gradient(circle 2px at 25% 18%, rgba(159, 212, 212, 0.35) 0%, transparent 100%), radial-gradient(circle 4px at 45% 25%, rgba(232, 165, 181, 0.4) 0%, transparent 100%), radial-gradient(circle 3px at 65% 15%, rgba(123, 196, 196, 0.4) 0%, transparent 100%), radial-gradient(circle 2px at 85% 20%, rgba(196, 240, 234, 0.35) 0%, transparent 100%), radial-gradient(circle 3px at 35% 35%, rgba(232, 165, 181, 0.35) 0%, transparent 100%), 
radial-gradient(circle 2px at 75% 40%, rgba(180, 221, 221, 0.35) 0%, transparent 100%), radial-gradient(circle 4px at 20% 50%, rgba(123, 196, 196, 0.45) 0%, transparent 100%), radial-gradient(circle 3px at 90% 55%, rgba(196, 240, 234, 0.4) 0%, transparent 100%), radial-gradient(circle 2px at 50% 60%, rgba(232, 165, 181, 0.3) 0%, transparent 100%); pointer-events: none; border-radius: 3px; } .container .title-container { background: radial-gradient(circle at 15% 25%, rgba(30, 65, 80, 0.4) 0%, transparent 40%), radial-gradient(circle at 85% 70%, rgba(123, 196, 196, 0.2) 0%, transparent 45%), radial-gradient(circle at 50% 50%, rgba(20, 45, 60, 0.35) 0%, transparent 60%), linear-gradient(135deg, rgba(20, 45, 60, 0.3) 0%, rgba(15, 35, 50, 0.4) 50%, rgba(12, 28, 40, 0.5) 100%); margin-bottom: 50px; border: 3px solid; border-image: linear-gradient(135deg, rgba(123, 196, 196, 0.5) 0%, rgba(159, 212, 212, 0.6) 50%, rgba(123, 196, 196, 0.5) 100%) 1; border-radius: 0; padding: 60px 50px 70px; text-align: center; position: relative; overflow: hidden; box-shadow: 0 10px 50px rgba(0, 0, 0, 0.7), 0 4px 20px rgba(0, 0, 0, 0.8), inset 0 2px 8px rgba(123, 196, 196, 0.15); } .container .title-container::before { content: ''; position: absolute; top: -50%; right: -10%; width: 300px; height: 300px; background: radial-gradient(circle, rgba(44, 95, 111, 0.3) 0%, transparent 70%); border-radius: 40% 60% 70% 30%; filter: blur(40px); } .container .title-container::after { content: ''; position: absolute; bottom: -30%; left: -5%; width: 250px; height: 250px; background: radial-gradient(circle, rgba(232, 165, 181, 0.2) 0%, transparent 70%); border-radius: 60% 40% 30% 70%; filter: blur(35px); } .container .title-container .title-wrapper { position: relative; } .container .title-main { font-size: 3.5rem; font-weight: 800; margin: 0; letter-spacing: 6px; text-transform: uppercase; font-family: var(--font-title); position: relative; line-height: 1.2; z-index: 1; } .container .title-main 
.title-prefix { display: block; background: linear-gradient(135deg, #6EC5C5 0%, #E8A5B5 35%, #9FD4D4 70%, #B4E8DD 100%); background-clip: text; -webkit-background-clip: text; -webkit-text-fill-color: transparent; filter: drop-shadow(0 3px 12px rgba(110, 197, 197, 0.6)) drop-shadow(0 0 20px rgba(232, 165, 181, 0.4)); margin-bottom: 15px; font-size: 3.5rem; letter-spacing: 6px; font-weight: 700; position: relative; padding-bottom: 12px; font-family: 'Cinzel', serif; text-transform: uppercase; } .container .title-main .title-prefix::after { content: ''; position: absolute; bottom: 0; left: 50%; transform: translateX(-50%); width: 80px; height: 4px; background: linear-gradient(90deg, transparent 0%, rgba(159, 212, 212, 0.8) 35%, rgba(232, 165, 181, 0.8) 65%, transparent 100%); border-radius: 2px; box-shadow: 0 0 10px rgba(232, 165, 181, 0.5); } .container .title-main .title-version { display: inline-block; background: linear-gradient(135deg, #8DD4D4 0%, #A8E0E0 50%, #C4F0EA 100%); background-clip: text; -webkit-background-clip: text; -webkit-text-fill-color: transparent; filter: drop-shadow(0 2px 8px rgba(141, 212, 212, 0.6)) drop-shadow(0 0 15px rgba(168, 224, 224, 0.5)); font-size: 2.5rem; letter-spacing: 4px; font-weight: 700; position: relative; padding: 5px 15px; border: 2px solid transparent; border-image: linear-gradient(135deg, rgba(141, 212, 212, 0.4), rgba(168, 224, 224, 0.6), rgba(141, 212, 212, 0.4)) 1; font-family: 'Cinzel', serif; text-transform: uppercase; } .container .title-main .title-version::before { content: ''; position: absolute; top: -8px; left: -8px; right: -8px; bottom: -8px; background: linear-gradient(135deg, rgba(141, 212, 212, 0.15), rgba(44, 95, 111, 0.1)); z-index: -1; transform: skew(-2deg); } .container .lemonade-text { background: linear-gradient(135deg, var(--red-deep), var(--primary-accent)); background-clip: text; -webkit-background-clip: text; -webkit-text-fill-color: transparent; filter: drop-shadow(0 2px 6px rgba(232, 107, 142, 
0.6)); } .container .title-subtitle { padding-left: 0; margin-top: 15px; } .container .subtitle-text { color: var(--text-muted); font-size: 1.2rem; font-family: var(--font-body); font-style: italic; font-weight: 400; letter-spacing: 2px; text-transform: uppercase; opacity: 0.9; text-shadow: 0 0 10px rgba(159, 212, 212, 0.3); } .container img { max-width: 100%; border: 2px solid rgba(44, 95, 111, 0.5); margin-bottom: 40px; box-shadow: 0 8px 30px rgba(0, 0, 0, 0.7), 0 3px 12px rgba(123, 196, 196, 0.4), 0 0 20px rgba(232, 165, 181, 0.3); border-radius: 2px; position: relative; } .container img::after { content: ''; position: absolute; inset: -5px; background: linear-gradient(135deg, rgba(123, 196, 196, 0.2), rgba(232, 165, 181, 0.15)); filter: blur(8px); z-index: -1; } .container .section-container { margin-bottom: 35px; padding: 30px; background: linear-gradient(135deg, rgba(25, 55, 70, 0.85) 0%, rgba(30, 65, 80, 0.9) 50%, rgba(25, 55, 70, 0.85) 100%); border: 2px solid transparent; border-image: linear-gradient(135deg, rgba(123, 196, 196, 0.6), rgba(159, 212, 212, 0.7), rgba(123, 196, 196, 0.6)) 1; border-radius: 0; box-shadow: 0 8px 35px rgba(0, 0, 0, 0.7), inset 0 2px 8px rgba(123, 196, 196, 0.3), 0 0 25px rgba(123, 196, 196, 0.3), inset 0 -1px 20px rgba(159, 212, 212, 0.12); position: relative; } .container .section-container::before { content: ''; position: absolute; top: 0; left: 0; right: 0; bottom: 0; background: radial-gradient(circle at 20% 30%, rgba(123, 196, 196, 0.25) 0%, transparent 50%), radial-gradient(circle at 80% 70%, rgba(159, 212, 212, 0.15) 0%, transparent 50%), radial-gradient(circle at 50% 10%, rgba(232, 165, 181, 0.1) 0%, transparent 60%); pointer-events: none; z-index: 0; } .container .section-container:last-of-type { margin-bottom: 0; } .container .section-header { display: flex; align-items: center; padding: 0 0 18px 0; border-bottom: 2px solid rgba(123, 196, 196, 0.4); margin-bottom: 25px; position: relative; z-index: 1; } .container 
.section-title { font-family: var(--font-title); background: linear-gradient(135deg, #9FD4D4 0%, #B4E8DD 100%); background-clip: text; -webkit-background-clip: text; -webkit-text-fill-color: transparent; font-size: 1.5rem; margin: 0 !important; padding: 0 !important; letter-spacing: 2px; font-weight: 700; text-transform: uppercase; border: none !important; position: relative; display: inline-block; filter: drop-shadow(0 2px 4px rgba(123, 196, 196, 0.5)); } .container .section-title::after { content: ''; position: absolute; bottom: -18px; left: 0; width: 50%; height: 2px; background-image: linear-gradient(to right, rgba(159, 212, 212, 0.7), transparent); opacity: 0.8; } .container .section-content { padding: 0; position: relative; z-index: 1; } .container .subheading { color: var(--secondary-accent); font-size: 1.25rem; margin-top: 28px; margin-bottom: 18px; font-weight: 600; display: block; text-transform: uppercase; letter-spacing: 1.5px; font-family: var(--font-title); border-bottom: 2px solid transparent; border-image: linear-gradient(to right, var(--primary-accent), var(--secondary-accent), transparent) 1; padding-bottom: 10px; text-shadow: 0 0 10px rgba(159, 212, 212, 0.4); } .container .data-box { background: linear-gradient(135deg, rgba(20, 40, 50, 0.6) 0%, rgba(25, 50, 60, 0.7) 100%); padding: 22px; border: 2px solid rgba(107, 155, 170, 0.3); border-left: 5px solid var(--primary-accent); margin-bottom: 20px; box-shadow: 0 4px 15px rgba(0, 0, 0, 0.5), inset 0 1px 2px rgba(44, 95, 111, 0.3), 0 0 10px rgba(232, 107, 142, 0.15); border-radius: 0; font-size: 1rem; position: relative; } .container .data-box::after { content: ''; position: absolute; top: 0; right: 0; width: 100px; height: 100px; background: radial-gradient(circle at top right, rgba(123, 196, 196, 0.08) 0%, transparent 60%); pointer-events: none; border-radius: 0 0 0 100%; } .container .data-row { display: flex; align-items: center; margin-bottom: 6px; padding: 5px 0; } .container 
.data-row:last-child { margin-bottom: 0; } .container .data-arrow { color: var(--secondary-accent); font-weight: bold; margin-right: 12px; font-family: var(--font-code); font-size: 1.1rem; text-shadow: 0 0 8px rgba(159, 212, 212, 0.5); } .container .data-label { color: var(--text-main); font-weight: 600; font-family: var(--font-body); margin-right: 10px; min-width: 90px; } .container a { color: var(--primary-accent); text-decoration: none; font-weight: 600; transition: all .2s; text-shadow: 0 0 10px rgba(232, 107, 142, 0.4); } .container .data-row a { border-bottom: 1px dotted var(--primary-accent); } .container a:hover { text-decoration: none; color: var(--secondary-accent); transform: translateY(-1px); filter: drop-shadow(0 2px 6px rgba(159, 212, 212, 0.6)); text-shadow: 0 0 15px rgba(159, 212, 212, 0.8); } .container .data-row a:hover { border-bottom-style: solid; border-bottom-color: var(--secondary-accent); } .container .dropdown-container { margin-top: 20px; } .container .dropdown-summary { cursor: pointer; padding: 10px 0; color: var(--text-muted); font-size: 1.1rem; font-weight: 700; text-transform: none; font-family: var(--font-title); letter-spacing: 1px; list-style: none; transition: color 0.2s ease; } .container .dropdown-summary:hover { color: var(--primary-accent); } .container .dropdown-arrow { color: var(--primary-accent); margin-right: 10px; transition: transform 0.2s ease; } .container .dropdown-content { margin-top: 15px; padding: 25px; background: linear-gradient(135deg, rgba(15, 30, 35, 0.8) 0%, rgba(20, 40, 50, 0.85) 100%); border: 2px solid rgba(107, 155, 170, 0.3); border-radius: 0; box-shadow: 0 4px 15px rgba(0, 0, 0, 0.6), inset 0 1px 3px rgba(44, 95, 111, 0.3), 0 0 10px rgba(232, 107, 142, 0.15); } .container .config-title { color: var(--secondary-accent); font-size: 1rem; margin-bottom: 10px; font-family: var(--font-body); text-transform: uppercase; letter-spacing: 1px; font-weight: 700; text-shadow: 0 0 10px rgba(159, 212, 212, 0.4); } 
.container pre { background: linear-gradient(135deg, rgba(20, 5, 5, 0.9) 0%, rgba(30, 8, 8, 0.95) 100%); padding: 22px; border: 2px solid rgba(139, 0, 0, 0.3); white-space: pre-wrap; word-wrap: break-word; color: var(--text-main); border-radius: 0; box-shadow: inset 0 2px 6px rgba(0, 0, 0, 0.5), 0 4px 12px rgba(0, 0, 0, 0.6); } .container pre code { background: none; color: inherit; padding: 0; border-radius: 0; } .container code { font-family: var(--font-code); color: var(--secondary-accent); background: rgba(159, 212, 212, 0.15); padding: 3px 7px; border-radius: 2px; box-shadow: 0 1px 3px rgba(159, 212, 212, 0.3); } body { background: linear-gradient(180deg, #0A1F2E 0%, #0D2838 15%, #102D3D 30%, #0D2838 50%, #0A1F2E 70%, #071520 85%, #040D15 100%); background-attachment: fixed; margin: 0; padding: 0; position: relative; overflow-x: hidden; } body::before { content: ''; position: fixed; left: -10%; bottom: 0; width: 25%; height: 100%; background-image: radial-gradient(ellipse 80px 200px at 20% 90%, rgba(0, 0, 0, 0.95), transparent), radial-gradient(ellipse 100px 300px at 15% 85%, rgba(0, 0, 0, 0.9), transparent), radial-gradient(ellipse 60px 250px at 25% 88%, rgba(0, 0, 0, 0.92), transparent), radial-gradient(ellipse 70px 180px at 10% 92%, rgba(0, 0, 0, 0.93), transparent), linear-gradient(to top, rgba(0, 0, 0, 0.8) 0%, transparent 60%); pointer-events: none; z-index: 1; } body::after { content: ''; position: fixed; right: -10%; bottom: 0; width: 25%; height: 100%; background-image: radial-gradient(ellipse 90px 220px at 80% 88%, rgba(0, 0, 0, 0.95), transparent), radial-gradient(ellipse 110px 320px at 85% 83%, rgba(0, 0, 0, 0.9), transparent), radial-gradient(ellipse 65px 260px at 75% 86%, rgba(0, 0, 0, 0.92), transparent), radial-gradient(ellipse 80px 190px at 90% 90%, rgba(0, 0, 0, 0.93), transparent), linear-gradient(to top, rgba(0, 0, 0, 0.8) 0%, transparent 60%); pointer-events: none; z-index: 1; } Magistral 24B Upscaled to 34B. 
The latest Magistral model seems pretty good and has some refreshing prose. This is an uncensored creative writing and RP model. It uses a new (still work-in-progress) dataset I've been curating based on real character cards. It has some structural repetition; at this point that's a calling card of Mistral models. I think it's better than v3, though.

Creation Process: Upscale > CPT > SFT > Merge

After upscaling, the model was pretrained on approx. 100MB of light novels and a subset of DCLM records. SFT used approx. 10 million tokens of SFW / NSFW RP, stories and creative instruct data. I've removed some chat data that I think hurt more than helped and replaced it with conversations from real character cards.

I experimented with LoRA methods, particularly DoRA vs rsLoRA. With DoRA the writing was fantastic, but the model wasn't able to handle its own creativity, even with further RLHF applied. rsLoRA took the data far better, but was significantly less adept at writing. I merged the two models together, using the stable version as the base, which seems to have successfully combined the positives of both.
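The upscale duplicates a band of middle layers: with passthrough slices [0, 29] and [10, 40] over the original 40-layer model, the result is 59 layers, with layers 10-28 appearing twice. A quick sketch of that arithmetic (the helper name is mine, not mergekit's):

```python
def upscaled_depth(slices):
    """Total layer count after a passthrough upscale.

    Each (start, end) half-open range contributes end - start layers;
    overlapping ranges mean those layers appear twice in the output.
    """
    return sum(end - start for start, end in slices)

slices = [(0, 29), (10, 40)]
print(upscaled_depth(slices))                      # 59 layers, up from 40
print(len(set(range(0, 29)) & set(range(10, 40)))) # 19 duplicated layers
```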
Upscale

base_model: Darkhn/Magistral-Small-2509-Text-Only
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: Darkhn/Magistral-Small-2509-Text-Only
        layer_range: [0, 29]
  - sources:
      - model: Darkhn/Magistral-Small-2509-Text-Only
        layer_range: [10, 40]

Slerp Merge

models:
  - model: ApocalypseParty/Magi-PT-2-SFT-1-DPO-3
  - model: ApocalypseParty/Magi-PT-2-SFT-2
merge_method: slerp
base_model: ApocalypseParty/Magi-PT-2-SFT-2
parameters:
  t: [0, 0, 0, 0.1, 0.2]
dtype: bfloat16

Pretrain (2xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ApocalypseParty/magistral-34b
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/textfilesminimaldataset.jsonl
    type: completion
  - path: ./data/filteredresults.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 64
lora_alpha: 64
lora_dropout: 0.0
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 3e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.0
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 16384
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Magi-PT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Magi-PT
# wandb_entity: your_entity
wandb_name: Magi-PT-2

SFT (2xH100)

base_model: ApocalypseParty/Magi-PT-2
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken
plugins:
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
load_in_8bit: true
load_in_4bit: false
deepspeed: deepspeed_configs/zero1.json
dataset_prepared_path: last_run_prepared
val_set_size: 0
output_dir: ./Magi-PT-2-SFT-2
lora_r: 128
lora_alpha: 128
lora_dropout: 0.05
lora_target_linear: true
lora_target_modules:
  - gate_proj
  - down_proj
  - up_proj
  - q_proj
  - v_proj
  - k_proj
  - o_proj
gradient_accumulation_steps: 4
micro_batch_size: 2
num_epochs: 3
optimizer: adamw_bnb_8bit
lr_scheduler: cosine
learning_rate: 1e-5
gradient_checkpointing: true
resume_from_checkpoint:
logging_steps: 1
flash_attention: true
warmup_ratio: 0.05
evals_per_epoch: 1
saves_per_epoch: 2
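The slerp merge above combines the two checkpoints along the great-circle arc between their weight tensors rather than linearly. A minimal per-tensor sketch of the standard slerp formula (mergekit's actual implementation differs in details):

```python
import numpy as np

def slerp(t, v0, v1, eps=1e-8):
    """Spherical linear interpolation between two weight tensors.

    t=0 returns v0, t=1 returns v1; intermediate t follows the arc
    between the flattened tensors instead of a straight line.
    """
    a = v0.ravel().astype(np.float64)
    b = v1.ravel().astype(np.float64)
    # Angle between the two tensors, via clipped cosine similarity
    cos = np.clip(np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b) + eps), -1.0, 1.0)
    theta = np.arccos(cos)
    if abs(theta) < eps:  # near-parallel tensors: fall back to lerp
        out = (1 - t) * a + t * b
    else:
        s = np.sin(theta)
        out = (np.sin((1 - t) * theta) / s) * a + (np.sin(t * theta) / s) * b
    return out.reshape(v0.shape).astype(v0.dtype)
```

With the layer-grouped schedule `t: [0, 0, 0, 0.1, 0.2]`, most of the network stays at the base (t = 0) checkpoint and only the deeper layer groups blend in a small fraction of the other model.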

license:mit
13
0

MS3.2-PaintedFantasy-v4.1-24B

license:mit
11
0

MS3.2-PaintedFantasy-v2-24b-exl3-4bpw

This is an uncensored creative model intended to excel at character-driven RP / ERP. Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), but pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO

SFT with RP/ERP, stories and in-character assistant data. DPO focused on reducing repetition, misgendered characters and slop. KTO focused on further reducing repetition and slop. Not optimized for cost / performance efficiency; YMMV.
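For reference, the DPO stage trains on preference pairs (e.g. a repetitive completion marked as rejected against a cleaner chosen one). A minimal sketch of the per-pair DPO objective, not the exact trainer used here:

```python
import math

def dpo_loss(policy_chosen_logp, policy_rejected_logp,
             ref_chosen_logp, ref_rejected_logp, beta=0.1):
    """Direct Preference Optimization loss for one preference pair.

    Pushes the policy to raise the chosen response's log-probability
    relative to the frozen reference model, and lower the rejected one's.
    """
    chosen_ratio = policy_chosen_logp - ref_chosen_logp
    rejected_ratio = policy_rejected_logp - ref_rejected_logp
    logits = beta * (chosen_ratio - rejected_ratio)
    return -math.log(1 / (1 + math.exp(-logits)))  # -log(sigmoid(logits))
```

When the policy still matches the reference model the loss sits at log 2 ≈ 0.693; widening the chosen/rejected margin drives it toward zero, which is what penalizes the repetitive rejected samples.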
SFT (1xH100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: your_entity
wandb_name: run_name
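The dataset block in the config above expects one JSON object per line in ./dataset.jsonl, each carrying a messages list of system/user/assistant turns mapped through the tokenizer's chat template. A sketch of the record shape (the content itself is illustrative):

```python
import json

# One training record in the shape the dataset config describes:
# a "messages" list of role/content turns, with roles restricted to
# system / user / assistant.
record = {
    "messages": [
        {"role": "system", "content": "You are Aria, a wandering bard."},
        {"role": "user", "content": "Play something for the road."},
        {"role": "assistant", "content": "Aria tunes her lute and begins to sing."},
    ]
}

line = json.dumps(record)  # one record per line in dataset.jsonl
```

With train_on_inputs: false, loss is computed only on the assistant turns of each record.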

license:apache-2.0
11
0

MS3.2-PaintedFantasy-Visage-v4-34b-exl3-5bpw


license:mit
11
0

MS3.2-PaintedFantasy-v2-24b-exl3-3bpw

This is an uncensored creative model intended to excel at character-driven RP / ERP. Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), though it pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO

SFT with RP/ERP, stories and in-character assistant data. DPO focused on reducing repetition, misgendered characters and slop. KTO focused on further reducing repetition and slop.

Not optimized for cost / performance efficiency, YMMV.
SFT (1x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: yourentity
wandb_name: runname
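For reference, each line of a chat_template-type dataset like ./dataset.jsonl above is a single JSON object whose messages array follows the role mapping in the config. A hypothetical record (content invented for illustration; shown wrapped across lines here, but each record is one line in the .jsonl file):

```json
{
  "messages": [
    {"role": "system", "content": "You are Kaelen, a weary caravan guard. Stay in character."},
    {"role": "user", "content": "The gates are closing. Can we still make it inside?"},
    {"role": "assistant", "content": "Kaelen spits into the dust and shoulders his pack. \"If we run. Keep up.\""}
  ]
}
```

With train_on_inputs: false, only the assistant turns in each record contribute to the training loss.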

license:apache-2.0
10
0

MS3.2-PaintedFantasy-Visage-v2-33B-exl3-4bpw

A surprisingly difficult model to work with.
Removing the repetition came at the expense of the unique creativity the original upscale had, so I decided to upscale Painted Fantasy v2, heal it, and then merge the original upscale back in. The result is a smarter, uncensored, creative model that excels at character-driven RP / ERP, with characters portrayed creatively and proactively.

Creation process: Upscale > PT > SFT > KTO > DPO

Pretrained on approx. 300MB of light novels, stories and FineWeb-2 corpus. SFT on approx. 8 million tokens of SFW / NSFW RP, stories and creative instruct data. KTO on anti-repetition data created from the SFT datasets; rejected examples were generated by MS3.2 with repetition_penalty=0.9 and OOC commands encouraging it to misgender, impersonate the user, etc. DPO on a high quality, unreleased RP / NSFW dataset, with rejected samples created by the same method as for KTO.

The resulting model was not repetitive, but had lost some of the spark the original upscale had, so the original upscale was merged back in, taking care not to reintroduce repetition.

Merge configurations used during the model creation process:

Initial Upscale (Passthrough)

base_model: zerofata/MS3.2-PaintedFantasy-v2-24B
dtype: bfloat16
slices:
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [0, 29]
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [10, 39]

Final Merge (Slerp)

models:
  - model: zerofata/MS3.2-PaintedFantasy-Visage-33B
  - model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
merge_method: slerp
base_model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
parameters:
  t: [0.4, 0.2, 0, 0.2, 0.4]
dtype: bfloat16

Not optimized for cost / performance efficiency, YMMV.
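The slerp t values are anchor points rather than per-layer values: mergekit spreads the anchors evenly across the layer stack and linearly interpolates between them, so the middle layers stay closest to the base model (t near 0) while the outermost layers blend about 40% toward the other model. A minimal sketch of that interpolation, assuming evenly spaced anchors and a hypothetical 59-layer stack (the function is illustrative, not a mergekit API):

```python
def t_for_layers(anchors, num_layers):
    """Linearly interpolate slerp `t` anchor values across a layer stack."""
    segments = len(anchors) - 1
    ts = []
    for i in range(num_layers):
        x = i / (num_layers - 1)                 # layer position in [0, 1]
        seg = min(int(x * segments), segments - 1)
        frac = x * segments - seg                # position within this segment
        ts.append(anchors[seg] + frac * (anchors[seg + 1] - anchors[seg]))
    return ts

ts = t_for_layers([0.4, 0.2, 0, 0.2, 0.4], 59)
# first/last layers: t = 0.4; exact midpoint layer: t = 0 (pure base model)
```

In this merge t=0 means the healed PT/SFT/KTO/DPO model and t=1 the original upscale, so the schedule preserves the healed model's behavior in the middle layers while reintroducing the upscale's character at the edges.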
Pretrain (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv2upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-PT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1

SFT (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/automateddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/handcrafteddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/instructdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/storiesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwclaudedataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/summariesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-SFT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2

KTO (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: kto
rl_beta: 0.1
kto_desirable_weight: 1.25
kto_undesirable_weight: 1.0

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetkto.jsonl
    type: llama3.argilla
  - path: ./approvedrpdatasetkto.jsonl
    type: llama3.argilla
  - path: ./instructdatasetkto.jsonl
    type: llama3.argilla
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses
remove_unused_columns: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 4
learning_rate: 5e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 15
weight_decay: 0.001
max_grad_norm: 0.01

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 100
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-KTO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-KTO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-KTO-1

DPO (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.1

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 2e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-DPO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-DPO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-DPO-1
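The DPO stage consumes preference pairs: a shared conversation prefix plus a chosen and a rejected assistant completion, matching the field_chosen / field_rejected mapping in the config. A hypothetical record (content invented for illustration; the exact shape of the chosen/rejected fields is an assumption about the chat_template.default format, and each record is one line in the .jsonl file):

```json
{
  "messages": [
    {"role": "system", "content": "Roleplay as Mira. Never speak for the user."},
    {"role": "user", "content": "I hand her the letter without a word."}
  ],
  "chosen": {"role": "assistant", "content": "Mira turns the envelope over twice before breaking the seal."},
  "rejected": {"role": "assistant", "content": "You hand me the letter and I read it. You hand me the letter and I read it."}
}
```

The rejected side here mirrors how the card describes generating rejections: deliberately repetitive or rule-breaking completions.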

license:apache-2.0
10
0

MS3.2-PaintedFantasy-Visage-v3-34B-exl3-4bpw

No layer left behind edition. Upscale redone with the missing final layer included.
The original upscales were always missing a layer, but I never troubleshot which one. Turns out it was the final layer. That's kind of an important one.

This is an uncensored creative writing and RP model. Compared to the older version it is smarter and, I think, has a bit less repetition. The old V2 version is slightly more creative, though, due to the instability it had.

Creation process: Upscale > CPT > SFT > DPO

Pretrained on approx. 300MB of light novel and FineWeb-2 corpus. SFT on approx. 8 million tokens of SFW / NSFW RP, stories and creative instruct data. DPO on a high quality RP / NSFW dataset with a focus on improving instruction following, reducing repetition and fixing common model mistakes.

Merge configuration used during the model creation process:

Upscale (Passthrough)

base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [0, 29]
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [10, 40]

Not optimized for cost / performance efficiency, YMMV.
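A quick way to see the off-by-one: mergekit's layer_range is half-open, so [start, end] selects layers start through end-1. On a 40-layer base, the old [10, 39] slice stopped at layer 38 and dropped layer 39 (the final layer), while [10, 40] keeps it, which is also why this upscale is one layer deeper than the older one. A small sketch (the function is illustrative, not a mergekit API):

```python
def passthrough_layers(slices):
    """Expand mergekit-style half-open layer ranges into a flat layer list."""
    layers = []
    for start, end in slices:
        layers.extend(range(start, end))  # [start, end) selects start..end-1
    return layers

old = passthrough_layers([(0, 29), (10, 39)])  # original upscale: 58 layers
new = passthrough_layers([(0, 29), (10, 40)])  # redone upscale: 59 layers

assert 39 not in old and 39 in new  # layer 39, the final layer, was missing
```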
Pretrain (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv3upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-PT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1

SFT (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-SFT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2

DPO (2x H200)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.085

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
  - path: ./data/approvedautomatedl3dataset.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: lora
load_in_8bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 2e-6
optimizer: adamw_torch_fused
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this
deepspeed: deepspeed_configs/zero1.json

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2-DPO-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-DPO
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2-DPO-2
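For reference, the objective the DPO stage optimizes can be sketched as below, with beta = 0.085 as in the config above. This is a generic illustration of the DPO loss for one preference pair, not axolotl's actual implementation:

```python
import math

def dpo_loss(policy_chosen, policy_rejected, ref_chosen, ref_rejected, beta=0.085):
    """Sketch of the DPO loss for a single preference pair.

    Arguments are summed log-probs of the chosen / rejected responses
    under the policy and the frozen reference model; beta plays the
    role of rl_beta in the config above.
    """
    margin = (policy_chosen - ref_chosen) - (policy_rejected - ref_rejected)
    # -log(sigmoid(beta * margin)): loss falls as the policy prefers the
    # chosen response more strongly than the reference does.
    return -math.log(1.0 / (1.0 + math.exp(-beta * margin)))

# Zero margin gives -log(0.5); a positive margin gives a smaller loss.
print(round(dpo_loss(0, 0, 0, 0), 4))          # 0.6931
print(dpo_loss(-10, -30, -12, -25) < 0.6931)   # True (margin = +7)
```

A small beta like 0.085 flattens the sigmoid, so the policy is allowed to drift further from the reference before the gradient saturates.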

9
1

L3.3-GeneticLemonade-Unleashed-70B-4.5bpw-h6-exl2

llama
8
0

MS3.2-PaintedFantasy-Visage-33B_exl3_4bpw

license:apache-2.0
8
0

MS3.2-PaintedFantasy-Visage-33B_exl3_5bpw

license:apache-2.0
8
0

MS3.2-PaintedFantasy-v2-24b-exl3-3.5bpw

This is an uncensored creative model intended to excel at character-driven RP / ERP.

Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), but pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO

SFT with RP / ERP, stories and in-character assistant data.
DPO focused on reducing repetition, misgendered characters and slop.
KTO focused on further reducing repetition and slop.

Not optimized for cost / performance efficiency, YMMV.
SFT (1x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: yourentity
wandb_name: runname
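The "only train on assistant responses" setting that appears throughout these configs means the loss is computed only on assistant tokens; everything else is masked out of the labels. A minimal sketch of that masking (hypothetical token IDs; real trainers derive the assistant spans from the tokenizer's chat template):

```python
IGNORE_INDEX = -100  # ignored by cross-entropy loss in PyTorch-style trainers

def mask_labels(token_ids, is_assistant):
    """Copy token_ids into labels, masking every non-assistant position."""
    return [tok if asst else IGNORE_INDEX
            for tok, asst in zip(token_ids, is_assistant)]

# Hypothetical 6-token turn: 3 user/system tokens, then 3 assistant tokens.
labels = mask_labels([11, 12, 13, 21, 22, 23],
                     [False, False, False, True, True, True])
print(labels)  # [-100, -100, -100, 21, 22, 23]
```

The pretrain stage uses `type: completion` instead, where every token contributes to the loss.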

license:apache-2.0
8
0

MS3.2-PaintedFantasy-Visage-v2-33B-exl3-6bpw

A surprisingly difficult model to work with.
Removing the repetition came at the expense of the unique creativity the original upscale had, so I decided to upscale Painted Fantasy v2, heal it, and then merge the original upscale back in. The result is a smarter, uncensored, creative model that excels at character-driven RP / ERP where characters are portrayed creatively and proactively.

Creation Process: Upscale > PT > SFT > KTO > DPO

Pretrained on approx. 300MB of light novels, stories and FineWeb-2 corpus.
SFT on approx. 8 million tokens of SFW / NSFW RP, stories and creative instruct data.
KTO on anti-repetition data created from the SFT datasets. Rejected examples were generated by MS3.2 with repetition_penalty=0.9 and OOC commands encouraging it to misgender characters, impersonate the user, etc.
DPO on a high quality, unreleased RP / NSFW dataset, with rejected samples created the same way as for KTO.

The resulting model was non-repetitive but had lost some of the spark the original upscale had, so the original upscale was merged back in, taking care not to reintroduce repetition.

Merge configurations used during the model creation process.

Initial Upscale (Passthrough)

base_model: zerofata/MS3.2-PaintedFantasy-v2-24B
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [0, 29]
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [10, 39]

Final Merge (Slerp)

models:
  - model: zerofata/MS3.2-PaintedFantasy-Visage-33B
  - model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
merge_method: slerp
base_model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
parameters:
  t: [0.4, 0.2, 0, 0.2, 0.4]
dtype: bfloat16

Not optimized for cost / performance efficiency, YMMV.
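In a slerp merge, each tensor is spherically interpolated between the two models, and the `t` list is a per-depth schedule (assuming t = 0 keeps the base model, the healed model's middle layers are left untouched while the outer layers lean 40% toward the original upscale). A generic slerp sketch, my own illustration rather than mergekit's exact code:

```python
import math

def slerp(v0, v1, t, eps=1e-8):
    """Spherical linear interpolation between two weight vectors."""
    n0 = math.sqrt(sum(x * x for x in v0))
    n1 = math.sqrt(sum(x * x for x in v1))
    dot = sum(a * b for a, b in zip(v0, v1)) / max(n0 * n1, eps)
    dot = max(-1.0, min(1.0, dot))
    theta = math.acos(dot)
    if theta < eps:  # nearly colinear: fall back to plain lerp
        return [(1 - t) * a + t * b for a, b in zip(v0, v1)]
    s0 = math.sin((1 - t) * theta) / math.sin(theta)
    s1 = math.sin(t * theta) / math.sin(theta)
    return [s0 * a + s1 * b for a, b in zip(v0, v1)]

print(slerp([1.0, 0.0], [0.0, 1.0], 0.0))  # [1.0, 0.0] -> stays on the base
mid = slerp([1.0, 0.0], [0.0, 1.0], 0.5)   # halfway along the arc
```

Unlike linear interpolation, slerp preserves the norm of the interpolated direction, which is often gentler on attention weights.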
Pretrain (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv2upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-PT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1

SFT (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/automateddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/handcrafteddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/instructdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/storiesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwclaudedataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/summariesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-SFT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2

KTO (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: kto
rl_beta: 0.1
kto_desirable_weight: 1.25
kto_undesirable_weight: 1.0

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetkto.jsonl
    type: llama3.argilla
  - path: ./approvedrpdatasetkto.jsonl
    type: llama3.argilla
  - path: ./instructdatasetkto.jsonl
    type: llama3.argilla
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses
remove_unused_columns: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 4
learning_rate: 5e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 15
weight_decay: 0.001
max_grad_norm: 0.01

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 100
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-KTO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-KTO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-KTO-1

DPO (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.1

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 2e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-DPO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-DPO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-DPO-1
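The KTO stage above up-weights desirable examples (desirable weight 1.25 vs. undesirable weight 1.0), which matters when the two classes are imbalanced. A simplified sketch of that asymmetry; the real KTO loss also subtracts a reference-model KL baseline, which is folded into `reward_gap` here:

```python
import math

def sigmoid(x):
    return 1.0 / (1.0 + math.exp(-x))

def kto_term(reward_gap, desirable, beta=0.1,
             desirable_weight=1.25, undesirable_weight=1.0):
    """Per-example KTO-style loss term. reward_gap is the policy-vs-
    reference log-ratio minus the batch KL baseline (simplified)."""
    if desirable:
        return desirable_weight * (1.0 - sigmoid(beta * reward_gap))
    return undesirable_weight * (1.0 - sigmoid(-beta * reward_gap))

# Same |gap| on both sides, but the desirable side is up-weighted 1.25x.
ratio = kto_term(5.0, desirable=True) / kto_term(-5.0, desirable=False)
print(round(ratio, 6))  # 1.25
```

Unlike DPO, KTO needs only per-example "good / bad" labels rather than paired chosen/rejected responses, which fits the anti-repetition data described above.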

license:apache-2.0
8
0

MS3.2-PaintedFantasy-Visage-33B

.container .dropdown-summary { cursor: pointer; color: var(--secondary-accent); font-size: 1.2rem; font-family: var(--font-heading); font-weight: 600; text-transform: uppercase; letter-spacing: 1px; list-style: none; padding: 5px 0; display: flex; align-items: center; } .container .dropdown-summary::-webkit-details-marker { display: none; } .container .dropdown-arrow { color: var(--primary-accent); margin-right: 15px; transition: transform 0.2s ease; display: inline-block; } .container .dropdown-container[open] .dropdown-arrow { transform: rotate(90deg); } .container .dropdown-content { margin-top: 15px; padding: 20px; background-color: var(--bg-main); border-left: 3px solid var(--primary-accent); } .container .config-title { color: var(--secondary-accent); font-size: 1rem; margin-bottom: 10px; font-family: var(--font-heading); text-transform: uppercase; letter-spacing: 1px; } .container pre { background-color: var(--bg-main); padding: 15px; border: 1px solid rgba(248, 96, 44, 0.4); white-space: pre-wrap; word-wrap: break-word; color: var(--text-main); } .container code { font-family: var(--font-code); } Another experimental release. Mistral Small 3.2 24B upscaled by 18 layers to create a 33.6B model. This model then went through pretraining, SFT & DPO. Can't guarantee the Mistral 3.2 repetition issues are fixed, but this model seems to be less repetitive than my previous attempt. This is an uncensored creative model intended to excel at character driven RP / ERP where characters are portrayed creatively and proactively. Creation process: Upscale > Pretrain > SFT > DPO All training was qlora (including pretrain). Pretrained on 177MB of data. Dataset consisteted mostly of Light Novels, NSFW stories, SFW stories and filled out with general corpus text from Huggingface FineWeb-2 dataset. The model then went through SFT using a dataset of approx 3.6 million tokens, 700 RP conversations, 1000 creative writing / instruct samples and about 100 summaries. 
The bulk of this data has been made public. Finally, DPO was used to make the model more consistent.

Upscale (Passthrough)

```yaml
base_model: anthracite-core/Mistral-Small-3.2-24B-Instruct-2506-Text-Only
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: anthracite-core/Mistral-Small-3.2-24B-Instruct-2506-Text-Only
        layer_range: [0, 29]
  - sources:
      - model: anthracite-core/Mistral-Small-3.2-24B-Instruct-2506-Text-Only
        layer_range: [10, 39]
```

Not optimized for cost / performance efficiency, YMMV.

SFT (1x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./UpscaleMistral-PT/merged
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 4
gradient_accumulation_steps: 2
learning_rate: 1.5e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 5
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./UpscaleMistral-PT-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: MS3-2-SFT
wandb_entity: yourentity
wandb_name: runname
```
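A quick sketch (mine, not from the card) of how the passthrough slices above produce the upscaled layer count, assuming mergekit's half-open `layer_range: [start, end)` convention:

```python
# Hypothetical sketch: layer arithmetic for the passthrough upscale.
# Each slice contributes (end - start) layers under the half-open convention.
slices = [(0, 29), (10, 39)]

total_layers = sum(end - start for start, end in slices)
# layers 10..28 appear in both slices, i.e. they are duplicated in the merge
duplicated = len(set(range(0, 29)) & set(range(10, 39)))

print(total_layers)  # 58: the base model's 40 layers plus the +18 described above
print(duplicated)    # 19 duplicated layers (the final base layer falls outside both ranges)
```

The net gain is 18 rather than 19 because the second slice stops one layer short of the end of the base model.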

license:apache-2.0

MS3.2-PaintedFantasy-v2-24b-exl3-6bpw

This is an uncensored creative model intended to excel at character-driven RP / ERP. Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), but pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO

- SFT with RP/ERP, stories and in-character assistant data.
- DPO focused on reducing repetition, misgendered characters and slop.
- KTO focused on further reducing repetition and slop.

Not optimized for cost / performance efficiency, YMMV.
SFT (1x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: yourentity
wandb_name: runname
```
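For readers tuning the training parameters above: the samples seen per optimizer step fall out of the micro-batch size, gradient accumulation and GPU count. This is the standard formula, not something stated in the card, and the helper name is mine:

```python
def effective_batch_size(micro_batch_size: int, grad_accum_steps: int, num_gpus: int) -> int:
    """Samples contributing to each optimizer update."""
    return micro_batch_size * grad_accum_steps * num_gpus

# This card's SFT run: 1x H100, micro batch 8, no accumulation
print(effective_batch_size(8, 1, 1))  # 8
# The 33B upscale's SFT run: micro batch 4, accumulation 2 - same effective batch
print(effective_batch_size(4, 2, 1))  # 8
```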

license:apache-2.0

MS3.2-PaintedFantasy-Visage-v2-33B-exl3-3bpw

A surprisingly difficult model to work with. Removing the repetition was coming at the expense of the unique creativity the original upscale had. I decided on upscaling Painted Fantasy v2, healing it and then merging the original upscale back in.

The result is a smarter, uncensored, creative model that excels at character-driven RP / ERP where characters are portrayed creatively and proactively.

Creation process: Upscale > PT > SFT > KTO > DPO

- Pretrained on approx 300MB of light novels, stories and FineWeb-2 corpus.
- SFT on approx 8 million tokens: SFW / NSFW RP, stories and creative instruct data.
- KTO on anti-rep data created from the SFT datasets. Rejected examples were generated by MS3.2 with repetition_penalty=0.9 and OOC commands encouraging it to misgender characters, impersonate the user, etc.
- DPO on a high quality, unreleased RP / NSFW dataset, using rejected samples created the same way as for KTO.

The resulting model was non-repetitive, but had lost some of the spark the original upscale had. I merged the original upscale back in, making sure not to reintroduce repetition.

Merge configurations used during the model creation process.

Initial Upscale (Passthrough)

```yaml
base_model: zerofata/MS3.2-PaintedFantasy-v2-24B
dtype: bfloat16
slices:
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [0, 29]
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [10, 39]
```

Final Merge (Slerp)

```yaml
models:
  - model: zerofata/MS3.2-PaintedFantasy-Visage-33B
  - model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
merge_method: slerp
base_model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
parameters:
  t: [0.4, 0.2, 0, 0.2, 0.4]
dtype: bfloat16
```

Not optimized for cost / performance efficiency, YMMV.
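The Slerp merge above blends the two checkpoints with a per-layer-group t of [0.4, 0.2, 0, 0.2, 0.4]: middle layers stay closest to the healed base (t=0) while the outer layers take more of the original upscale. A minimal sketch of spherical linear interpolation on flattened weight vectors (the standard slerp formula, for illustration only; this is not mergekit's actual implementation):

```python
import math

def slerp(t, v0, v1, eps=1e-8):
    """Interpolate along the arc between two weight vectors; t=0 returns v0."""
    dot = sum(a * b for a, b in zip(v0, v1))
    n0 = math.sqrt(sum(a * a for a in v0))
    n1 = math.sqrt(sum(b * b for b in v1))
    # clamp to avoid math domain errors from floating point drift
    cos_theta = max(-1.0, min(1.0, dot / (n0 * n1 + eps)))
    theta = math.acos(cos_theta)
    if theta < 1e-6:  # nearly parallel vectors: plain lerp is fine
        return [(1 - t) * a + t * b for a, b in zip(v0, v1)]
    s0 = math.sin((1 - t) * theta) / math.sin(theta)
    s1 = math.sin(t * theta) / math.sin(theta)
    return [s0 * a + s1 * b for a, b in zip(v0, v1)]

# t=0 (the middle entry of the gradient) keeps the base model unchanged
base_kept = slerp(0.0, [1.0, 0.0], [0.0, 1.0])
# t=0.4 (the outer layer groups) pulls noticeably toward the second model
blended = slerp(0.4, [1.0, 0.0], [0.0, 1.0])
```

Unlike plain linear interpolation, slerp preserves the norm of the blended vector, which is one reason it is a popular merge method for model weights.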
Pretrain (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv2upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-PT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1
```

SFT (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/automateddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/handcrafteddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/instructdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/storiesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwclaudedataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/summariesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-SFT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2
```

KTO (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: kto
rl_beta: 0.1
kto_desirable_weight: 1.25
kto_undesirable_weight: 1.0

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetkto.jsonl
    type: llama3.argilla
  - path: ./approvedrpdatasetkto.jsonl
    type: llama3.argilla
  - path: ./instructdatasetkto.jsonl
    type: llama3.argilla
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses
remove_unused_columns: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 4
learning_rate: 5e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 15
weight_decay: 0.001
max_grad_norm: 0.01

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 100
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-KTO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-KTO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-KTO-1
```

DPO (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.1

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 2e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-DPO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-DPO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-DPO-1
```
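For context on the DPO stage above: the standard DPO objective, which the rl_beta value parameterizes, scores the policy's preference margin between chosen and rejected completions against a frozen reference model. A toy sketch of that formulation (standard DPO, not code from this card; the function name and numbers are mine):

```python
import math

def dpo_loss(pi_chosen, pi_rejected, ref_chosen, ref_rejected, beta=0.1):
    """Standard DPO loss for one preference pair, given summed log-probs."""
    margin = (pi_chosen - ref_chosen) - (pi_rejected - ref_rejected)
    return -math.log(1.0 / (1.0 + math.exp(-beta * margin)))  # -log(sigmoid(beta * margin))

# Policy identical to the reference: margin is 0, loss is log(2)
untrained = dpo_loss(-10.0, -12.0, -10.0, -12.0)
# Policy prefers the chosen completion more than the reference does: lower loss
improved = dpo_loss(-9.0, -13.0, -10.0, -12.0)
```

A small beta (0.1 here) tolerates larger drift from the reference before the loss saturates, which fits a light preference-tuning pass on top of SFT.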

license:apache-2.0

MS3.2-PaintedFantasy-Visage-33B_exl3_3bpw

license:apache-2.0

L3.3-GeneticLemonade-Opus-70B_exl3-4.25bpw

llama

nomad-llama-70b-4.25bpw-exl3

llama

MS3.2-PaintedFantasy-v2-24b-exl3-5bpw

This is an uncensored creative model intended to excel at character-driven RP / ERP. Version 2 feels quite different from the original, with a heavy focus on reducing repetition across conversations and improving instruction following. It has a pretty unique writing style and sense of creativity (IMO), but pays the price with intermittent brain farts.

Training process: SFT > DPO > KTO

- SFT with RP / ERP, stories and in-character assistant data.
- DPO focused on reducing repetition, misgendered characters and slop.
- KTO focused on further reducing repetition and slop.

Not optimized for cost / performance efficiency, YMMV.
SFT (1x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 8
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: true

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./PT-SFT1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: PF-SFT
wandb_entity: yourentity
wandb_name: runname
```
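The `chat_template` dataset entry above expects an OpenAI-style `messages` list per JSONL line. As a rough illustration (the record text is invented; only the field layout follows the `field_messages` / role mapping in the config), one line of `dataset.jsonl` could be produced like this:

```python
import json

# Hypothetical record: field names follow the config's mapping
# (field_messages: messages, role/content keys, user/assistant/system roles).
record = {
    "messages": [
        {"role": "system", "content": "You are Mira, a wandering bard."},
        {"role": "user", "content": "Play something cheerful."},
        {"role": "assistant", "content": "Mira grins and strikes up a quick jig."},
    ]
}

# One line of dataset.jsonl; with train_on_inputs: false, loss is only
# computed on the assistant turn.
line = json.dumps(record)
```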

license:apache-2.0
6
0

MS3.2-PaintedFantasy-Visage-v4-34b-exl3-3bpw

license:mit
6
0

L3.3-GeneticLemonade-Unleashed-70B-6bpw-h8-exl2

llama
5
0

MS3.2-PaintedFantasy-24B_exl3-5bpw

license:apache-2.0
5
0

edens-fall-l3.3-70b-0.3c-exl3-4.25bpw

llama
5
0

MS3.2-PaintedFantasy-Visage-v2-33B-exl3-5bpw

A surprisingly difficult model to work with.
Removing the repetition came at the expense of the unique creativity the original upscale had, so I decided to upscale Painted Fantasy v2, heal it, and then merge the original upscale back in. The result is a smarter, uncensored, creative model that excels at character-driven RP / ERP where characters are portrayed creatively and proactively.

Creation process: Upscale > PT > SFT > KTO > DPO

- Pretrained on approx. 300MB of light novels, stories and FineWeb-2 corpus.
- SFT on approx. 8 million tokens of SFW / NSFW RP, stories and creative instruct data.
- KTO on anti-rep data created from the SFT datasets. Rejected examples were generated by MS3.2 with repetition_penalty=0.9 and OOC commands encouraging it to misgender, impersonate the user, etc.
- DPO on a high-quality, unreleased RP / NSFW dataset, with rejected samples created the same way as for KTO.

The resulting model was non-repetitive but had lost some of the spark the original upscale had, so the original upscale was merged back in, taking care not to reintroduce repetition.

Merge configurations used during the model creation process.

Initial Upscale (Passthrough)

```yaml
base_model: zerofata/MS3.2-PaintedFantasy-v2-24B
dtype: bfloat16
slices:
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [0, 29]
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [10, 39]
```

Final Merge (Slerp)

```yaml
models:
  - model: zerofata/MS3.2-PaintedFantasy-Visage-33B
  - model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
merge_method: slerp
base_model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
parameters:
  t: [0.4, 0.2, 0, 0.2, 0.4]
dtype: bfloat16
```

Not optimized for cost / performance efficiency, YMMV.
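The slerp `t` gradient above means the merge leans most on the original upscale (t = 0.4) at both ends of the network and keeps the healed base model (t = 0) around the middle layers. A pure-Python sketch of how such an anchor list could be spread across a 58-layer stack (an assumption about mergekit's evenly spaced interpolation, not its exact code):

```python
def spread_t(anchors, n_layers):
    """Linearly interpolate evenly spaced anchor values across layers."""
    ts = []
    for layer in range(n_layers):
        x = layer / (n_layers - 1) * (len(anchors) - 1)  # position in anchor space
        lo = int(x)
        hi = min(lo + 1, len(anchors) - 1)
        frac = x - lo
        ts.append(anchors[lo] * (1 - frac) + anchors[hi] * frac)
    return ts

per_layer_t = spread_t([0.4, 0.2, 0.0, 0.2, 0.4], 58)
```

With this schedule the middle layers stay closest to the anti-rep healed train, while the outer layers reintroduce the upscale's character.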
Pretrain (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv2upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-PT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1
```

SFT (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/automateddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/handcrafteddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/instructdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/storiesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwclaudedataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/summariesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-SFT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2
```

KTO (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: kto
rl_beta: 0.1
kto_desirable_weight: 1.25
kto_undesirable_weight: 1.0

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetkto.jsonl
    type: llama3.argilla
  - path: ./approvedrpdatasetkto.jsonl
    type: llama3.argilla
  - path: ./instructdatasetkto.jsonl
    type: llama3.argilla
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses
remove_unused_columns: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 4
learning_rate: 5e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 15
weight_decay: 0.001
max_grad_norm: 0.01

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 100
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-KTO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-KTO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-KTO-1
```

DPO (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.1

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 2e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-DPO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-DPO
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2-DPO-1
```
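The rejected samples for the KTO and DPO stages above were generated with repetition_penalty=0.9. In the usual HF-transformers formulation, a penalty below 1.0 boosts tokens that have already appeared rather than suppressing them, which is what makes the rejected outputs degenerately repetitive. A minimal sketch of that rule (illustrative, not the library's actual implementation):

```python
def apply_repetition_penalty(logits, seen_token_ids, penalty):
    # HF-style rule: positive logits are divided by the penalty and negative
    # logits multiplied by it, so penalty < 1.0 makes seen tokens MORE likely.
    out = list(logits)
    for tok in set(seen_token_ids):
        out[tok] = out[tok] / penalty if out[tok] > 0 else out[tok] * penalty
    return out

boosted = apply_repetition_penalty([2.0, -1.0, 0.5], seen_token_ids=[0, 1], penalty=0.9)
```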

license:apache-2.0
5
0

MS3.2 PaintedFantasy Visage V3 34B Exl3 5bpw

No layer left behind edition. Upscale redone with the missing final layer included.
The original upscales were always missing a layer, but I never troubleshot to identify which one. Turns out it was the final layer. That's kind of an important one. This is an uncensored creative writing and RP model. Compared to the older version it is smarter and, I think, has a bit less repetition, though the old V2 version is slightly more creative due to the instability it had.

Creation process: Upscale > CPT > SFT > DPO

- Pretrained on approx. 300MB of light novel and FineWeb-2 corpus.
- SFT on approx. 8 million tokens of SFW / NSFW RP, stories and creative instruct data.
- DPO on a high-quality RP / NSFW dataset focused on improving instruction following, reducing repetition and fixing common model mistakes.

Merge configuration used during the model creation process.

Upscale (Passthrough)

```yaml
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [0, 29]
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [10, 40]
```

Not optimized for cost / performance efficiency, YMMV.
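Assuming mergekit's half-open `layer_range` convention ([a, b] takes layers a through b-1), a quick check shows the fix: the older [10, 39] slice stopped one short of the 40-layer base's final layer, while [10, 40] keeps it.

```python
def upscaled_layer_count(slices):
    # Each (start, end) pair is half-open, mergekit-style.
    return sum(end - start for start, end in slices)

old_upscale = upscaled_layer_count([(0, 29), (10, 39)])  # earlier upscales: layer 39 dropped
new_upscale = upscaled_layer_count([(0, 29), (10, 40)])  # this upscale: final layer included
print(old_upscale, new_upscale)  # 58 59
```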
Pretrain (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv3upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-PT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1

SFT (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-SFT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2

DPO (2x H200)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.085

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
  - path: ./data/approvedautomatedl3dataset.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: lora
load_in_8bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 2e-6
optimizer: adamw_torch_fused
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this
deepspeed: deepspeed_configs/zero1.json

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2-DPO-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-DPO
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2-DPO-2
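For reference, the objective behind the DPO stage above scores each preference pair as -log σ(β · margin), where the margin compares the policy-vs-reference log-probability gap of the chosen response against that of the rejected one. A minimal scalar sketch (plain Python for illustration, not the Axolotl/TRL implementation; the default beta here mirrors rl_beta: 0.085 from the config):

```python
import math

def dpo_loss(policy_chosen_logp, policy_rejected_logp,
             ref_chosen_logp, ref_rejected_logp, beta=0.085):
    """Scalar DPO loss for one preference pair:
    -log(sigmoid(beta * [(chosen gap) - (rejected gap)])),
    where each gap is the policy log-prob minus the reference log-prob."""
    margin = ((policy_chosen_logp - ref_chosen_logp)
              - (policy_rejected_logp - ref_rejected_logp))
    return -math.log(1.0 / (1.0 + math.exp(-beta * margin)))

# No preference signal yet: loss starts at log(2)
start = dpo_loss(0.0, 0.0, 0.0, 0.0)
# Policy already favors the chosen response: loss falls below log(2)
improved = dpo_loss(-10.0, -30.0, -20.0, -20.0)
```

A small beta like 0.085 keeps the per-pair gradient gentle, which fits the stated goal of nudging style (repetition, instruction following) without drifting far from the SFT model.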

NaNK
4
1

L3.3-GeneticLemonade-Unleashed-v2.1-70B-4.5bpw-hb6-exl2

NaNK
llama
4
0

MS3.2-PaintedFantasy-24B_exl3-3bpw

NaNK
license:apache-2.0
4
0

tesseract-v2.0-llama-70b_exl3-4.25bpw

NaNK
llama
4
0

MS3.2-PaintedFantasy-Visage-v3-34B-exl3-3bpw

No layer left behind edition. Upscale redone with the missing final layer included.

NaNK
4
0

MS3.2-PaintedFantasy-Visage-v2-33B

A surprisingly difficult model to work with.
Removing the repetition came at the expense of the unique creativity the original upscale had. I settled on upscaling Painted Fantasy v2, healing it, and then merging the original upscale back in. The result is a smarter, uncensored, creative model that excels at character-driven RP / ERP where characters are portrayed creatively and proactively.

Creation Process: Upscale > PT > SFT > KTO > DPO

- Pretrained on approx. 300 MB of light novels, SFW / NSFW stories and FineWeb-2 corpus.
- SFT on approx. 8 million tokens: SFW / NSFW RP, stories and creative instruct data.
- KTO on anti-repetition data created from the SFT datasets. Rejected examples were generated by MS3.2 with repetition_penalty=0.9 and OOC commands encouraging it to misgender, impersonate the user, etc.
- DPO on an unreleased high-quality RP / NSFW dataset, with rejected samples created the same way as for KTO.

The resulting model was non-repetitive but had lost some of the spark the original upscale had, so I merged the original upscale back in, taking care not to reintroduce repetition.

Merge configurations used during the model creation process.

Initial Upscale (Passthrough)

base_model: zerofata/MS3.2-PaintedFantasy-v2-24B
dtype: bfloat16
slices:
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [0, 29]
  - sources:
      - model: zerofata/MS3.2-PaintedFantasy-v2-24B
        layer_range: [10, 39]

Final Merge (Slerp)

models:
  - model: zerofata/MS3.2-PaintedFantasy-Visage-33B
  - model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
merge_method: slerp
base_model: ../axolotl/Visage-V2-PT-1-SFT-2-KTO-1-DPO-1/merged
parameters:
  t: [0.4, 0.2, 0, 0.2, 0.4]
dtype: bfloat16

Not optimized for cost / performance efficiency, YMMV.
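The slerp step interpolates each tensor pair along the arc between the two models rather than along a straight line, and mergekit spreads the t list across the layer stack: with t: [0.4, 0.2, 0, 0.2, 0.4] and t=0 meaning "keep the base (healed) model", the outer layers lean toward the original upscale while the middle layers stay untouched. A minimal per-vector sketch of the interpolation itself (illustrative only, not mergekit's implementation):

```python
import math

def slerp(t, a, b):
    """Spherical linear interpolation between two flat vectors:
    t=0 returns a, t=1 returns b, intermediate t follows the arc."""
    norm_a = math.sqrt(sum(x * x for x in a))
    norm_b = math.sqrt(sum(x * x for x in b))
    cos_omega = sum(x * y for x, y in zip(a, b)) / (norm_a * norm_b)
    cos_omega = max(-1.0, min(1.0, cos_omega))  # guard acos domain
    omega = math.acos(cos_omega)
    if omega < 1e-8:  # nearly parallel vectors: plain lerp is fine
        return [(1 - t) * x + t * y for x, y in zip(a, b)]
    s = math.sin(omega)
    return [(math.sin((1 - t) * omega) * x + math.sin(t * omega) * y) / s
            for x, y in zip(a, b)]

# Orthogonal toy vectors: the halfway point lands at 45 degrees
mid = slerp(0.5, [1.0, 0.0], [0.0, 1.0])
```

Since slerp(0, a, b) == a, the t = 0 entry in the schedule means the middle layers are exactly the healed DPO model's tensors.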
Pretrain (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv2upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-PT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1

SFT (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/automateddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/handcrafteddataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/instructdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/storiesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/cwclaudedataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
  - path: ./data/summariesdataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 2
micro_batch_size: 2
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V2-SFT
# wandb_entity: yourentity
wandb_name: Visage-V2-PT-1-SFT-2

KTO (4x H100)

# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V2-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: kto
rl_beta: 0.1
kto_desirable_weight: 1.25
kto_undesirable_weight: 1.0

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./handcrafteddatasetkto.jsonl
    type: llama3.argilla
  - path: ./approvedrpdatasetkto.jsonl
    type: llama3.argilla
  - path: ./instructdatasetkto.jsonl
    type: llama3.argilla
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses
remove_unused_columns: False

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 4
learning_rate: 5e-6
optimizer: adamw_8bit
lr_scheduler: cosine
warmup_steps: 15
weight_decay: 0.001
max_grad_norm: 0.01

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# CHECKPOINTING
# ====================
save_steps: 100
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V2-PT-1-SFT-2-KTO-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project:
Visage-V2-KTO # wandbentity: yourentity wandbname: Visage-V2-PT-1-SFT-2-KTO-1 DPO 4H100 # ==================== # MODEL CONFIGURATION # ==================== basemodel: ./Visage-V2-PT-1-SFT-2/merged modeltype: MistralForCausalLM tokenizertype: AutoTokenizer chattemplate: mistralv7tekken # ==================== # RL/DPO CONFIGURATION # ==================== rl: dpo rlbeta: 0.1 # ==================== # DATASET CONFIGURATION # ==================== datasets: - path: ./handcrafteddatasetmistralrep.jsonl type: chattemplate.default fieldmessages: messages fieldchosen: chosen fieldrejected: rejected messagepropertymappings: role: role content: content roles: system: ["system"] user: ["user"] assistant: ["assistant"] datasetpreparedpath: trainoninputs: false # Only train on assistant responses # ==================== # QLORA CONFIGURATION # ==================== adapter: qlora loadin4bit: true lorar: 16 loraalpha: 32 loradropout: 0.1 loratargetlinear: true # loramodulestosave: # Uncomment only if you added NEW tokens # ==================== # TRAINING PARAMETERS # ==================== numepochs: 1 microbatchsize: 2 gradientaccumulationsteps: 1 learningrate: 2e-6 optimizer: adamw8bit lrscheduler: cosine warmupsteps: 5 weightdecay: 0.01 maxgradnorm: 1.0 # ==================== # SEQUENCE CONFIGURATION # ==================== sequencelen: 8192 padtosequencelen: true # ==================== # HARDWARE OPTIMIZATIONS # ==================== bf16: auto tf32: false flashattention: true gradientcheckpointing: offload deepspeed: deepspeedconfigs/zero1.json plugins: - axolotl.integrations.liger.LigerPlugin - axolotl.integrations.cutcrossentropy.CutCrossEntropyPlugin cutcrossentropy: true ligerrope: true ligerrmsnorm: true ligerlayernorm: true ligergluactivation: true ligercrossentropy: false # Cut Cross Entropy overrides this ligerfusedlinearcrossentropy: false # Cut Cross Entropy overrides this # ==================== # CHECKPOINTING # ==================== savesteps: 10 savetotallimit: 10 
loadbestmodelatend: true metricforbestmodel: evalloss greaterisbetter: false # ==================== # LOGGING & OUTPUT # ==================== outputdir: ./Visage-V2-PT-1-SFT-2-DPO-1 loggingsteps: 2 savesafetensors: true # ==================== # WANDB TRACKING # ==================== wandbproject: Visage-V2-DPO # wandbentity: yourentity wandbname: Visage-V2-PT-1-SFT-2-DPO-1
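The three stages above use quite different batch geometries. Assuming all four GPUs of the "4xH100" runs participate in data parallelism (an assumption; the configs don't state the world size explicitly), the effective global batch size per optimizer step can be sketched as:

```python
def effective_batch_size(micro_batch_size, grad_accum_steps, num_gpus):
    """Global batch size per optimizer step under data parallelism."""
    return micro_batch_size * grad_accum_steps * num_gpus

# Figures taken from the configs above
sft = effective_batch_size(2, 1, 4)  # SFT: micro batch 2, no accumulation
kto = effective_batch_size(4, 4, 4)  # KTO: micro batch 4, grad accum 4
dpo = effective_batch_size(2, 1, 4)  # DPO: micro batch 2, no accumulation
print(sft, kto, dpo)  # 8 64 8
```

The KTO stage trains on a much larger effective batch than the SFT and DPO stages, which is common for preference-optimization runs where per-step gradient noise matters.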

license:apache-2.0
3
7

MS3.2 PaintedFantasy Visage V3 34B Exl3 6bpw

No layer left behind edition. Upscale redone with the missing final layer included.
The original upscales were always missing a layer, but I never troubleshot which layer it was. Turns out it was the final layer. That's kind of an important one.

This model is an uncensored creative writing and RP model. Compared to the older version it is smarter and, I think, has a bit less repetition. The old V2 version is slightly more creative, though, due to the instability it had.

Creation Process: Upscale > CPT > SFT > DPO

Pretrained on approx 300MB of light novel and FineWeb-2 corpus. SFT on approx 8 million tokens of SFW / NSFW RP, stories and creative instruct data. DPO on a high quality RP / NSFW dataset with a focus on improving instruction following, reducing repetition and fixing common model mistakes.

Merge configuration used during the model creation process.

Upscale (Passthrough)

```yaml
base_model: ConicCat/Mistral-Small-3.2-AntiRep-24B
merge_method: passthrough
dtype: bfloat16
slices:
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [0, 29]
  - sources:
      - model: ConicCat/Mistral-Small-3.2-AntiRep-24B
        layer_range: [10, 40]
```

Not optimized for cost / performance efficiency, YMMV.
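Assuming mergekit's `layer_range` is end-exclusive ([start, end), the usual convention, but worth verifying against your mergekit version), the passthrough slices above can be sanity-checked with a few lines of arithmetic:

```python
def merged_layer_count(layer_ranges):
    """Decoder layers produced by a mergekit passthrough merge.

    Assumes each layer_range is half-open [start, end).
    """
    return sum(end - start for start, end in layer_ranges)

# Slices from the upscale config: [0, 29] and [10, 40]
total = merged_layer_count([(0, 29), (10, 40)])
print(total)  # 59
```

Stacking 29 + 30 layers yields 59, versus the 40 layers of the 24B donor model, which is roughly where the 34B parameter count comes from.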
Pretrain 4H100

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv3upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretrain_dataset_v5_stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-PT
wandb_entity: your_entity
wandb_name: Visage-V3-PT-1
```

SFT 4H100

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-SFT
wandb_entity: your_entity
wandb_name: Visage-V3-PT-1-SFT-2
```

DPO 2H200

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.085

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/handcrafted_dataset_mistral_rep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
  - path: ./data/approved_automated_l3_dataset.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: lora
load_in_8bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 2e-6
optimizer: adamw_torch_fused
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this
deepspeed: deepspeed_configs/zero1.json

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2-DPO-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-DPO
wandb_entity: your_entity
wandb_name: Visage-V3-PT-1-SFT-2-DPO-2
```
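For intuition about the DPO stage above (which uses a beta of 0.085), the textbook DPO objective per preference pair is -log sigmoid(beta * margin), where the margin compares how much more the trained policy prefers the chosen response than the frozen reference model does. A minimal pure-Python sketch, not the actual trainer implementation:

```python
import math

def dpo_loss(beta, policy_chosen, ref_chosen, policy_rejected, ref_rejected):
    """Textbook DPO loss for one preference pair.

    Arguments are summed token log-probs of the chosen/rejected responses
    under the trained policy and the frozen reference (SFT) model.
    """
    margin = (policy_chosen - ref_chosen) - (policy_rejected - ref_rejected)
    return -math.log(1.0 / (1.0 + math.exp(-beta * margin)))  # -log sigmoid

# With no preference shift the loss sits at log(2); a positive margin
# (policy favors the chosen response more than the reference does) lowers it.
baseline = dpo_loss(0.085, 0.0, 0.0, 0.0, 0.0)
improved = dpo_loss(0.085, -10.0, -12.0, -15.0, -13.0)
print(round(baseline, 4), improved < baseline)  # 0.6931 True
```

A smaller beta (0.085 here versus the 0.1 used for V2) softens the implicit KL constraint less per unit of margin, letting larger log-prob gaps accumulate before the loss saturates.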

3
2

L3.3-Genetic-Lemonade-Sunset-70B-4.5bpw-hb6-exl2

llama
3
0

L3.3-GeneticLemonade-Unleashed-v2-70b_6bpw-hb8-exl2

An experimental release. zerofata/GeneticLemonade-Unleashed qlora trained on a test dataset. Performance is improved from the original in my testing, but there are possibly (likely?) areas where the model will underperform, which I am looking for feedback on.

This is a creative model intended to excel at character driven RP / ERP. It has not been tested or trained on adventure stories or any large amounts of creative writing.

Play with these; they are not the 'best' settings, just a stable baseline.

Recommended Samplers

Llama-3-Instruct-Names, but you will need to uncheck "System same as user".

The model was trained on a tiny synthetic dataset of 450k tokens, approximately 130 conversations. Data was generated by script and then manually reviewed / edited. The dataset is approximately 60% SFW and 40% NSFW: 90% multi-turn RP conversations, 5% creative writing and 5% miscellaneous.
It is an experiment to see how models perform when provided with small amounts of high quality synthetic data, as opposed to human data.
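The stated percentages imply rough per-category token budgets. A quick back-of-the-envelope sketch (approximate figures only, taken from the card):

```python
def category_tokens(total_tokens, shares):
    """Rough token counts per category from stated percentages."""
    return {name: round(total_tokens * pct) for name, pct in shares.items()}

# Figures stated on the card: ~450k tokens over ~130 conversations
content = category_tokens(450_000, {"rp": 0.90, "creative_writing": 0.05, "misc": 0.05})
rating = category_tokens(450_000, {"sfw": 0.60, "nsfw": 0.40})
avg_conversation_len = 450_000 // 130
print(content["rp"], rating["sfw"], avg_conversation_len)  # 405000 270000 3461
```

So each conversation averages roughly 3.5k tokens, consistent with multi-turn RP logs rather than single exchanges.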

llama
3
0

L3.3-GeneticLemonade-Final-v2-70B_4.65bpw-hb6-exl2

llama
3
0

Tesseract-V0.2-Llama-70b_exl3-4.5bpw

llama
3
0

Tesseract-V0.2-Llama-70b_exl3-4.25bpw

llama
3
0

MS3.2-PaintedFantasy-24B_exl3-6bpw

license:apache-2.0
3
0

Austral-70b-Winton_exl3-4.25bpw

llama
3
0

MS3.2-PaintedFantasy-24B_exl3-4bpw

license:apache-2.0
2
0

MS3.2-PaintedFantasy-Visage-v3-34B-exl3-4.25bpw

.container { --primary-accent: #C0C0C0; --secondary-accent: #4A9EFF; --glow-primary: rgba(192, 192, 192, 0.6); --glow-secondary: rgba(74, 158, 255, 0.6); --bg-main: #0B0A18; --bg-container: #110F24; --bg-card: rgba(20, 18, 40, 0.7); --text-main: #DCDCDC; --text-muted: #9E9E9E; --white: #FFFFFF; --border-color: #3C3A50; --font-title: 'Cinzel', serif; --font-body: 'EB Garamond', serif; --font-code: 'Courier New', monospace; font-family: var(--font-body); color: var(--text-main); line-height: 1.6; font-weight: 400; max-width: 1100px; margin: 20px auto; padding: 25px; background-color: var(--bg-main); background-image: linear-gradient(rgba(11, 10, 24, 0.95), rgba(11, 10, 24, 0.95)), url('https://www.transparenttextures.com/patterns/stardust.png'); min-height: calc(100vh - 40px); border-radius: 8px; box-shadow: 0 0 25px rgba(0,0,0,0.7); border: 1px solid var(--border-color); } .container .title-container { background: linear-gradient(135deg, rgba(20, 18, 40, 0.8), rgba(30, 28, 50, 0.6)); margin-bottom: 30px; border: 1px solid var(--border-color); border-radius: 6px; padding: 25px; text-align: center; position: relative; box-shadow: 0 5px 15px rgba(0,0,0,0.4); overflow: hidden; } .container .title-main { color: var(--white); font-size: 2.5rem; font-weight: 700; margin: 0; letter-spacing: 4px; display: block; text-transform: uppercase; text-shadow: 0 0 4px var(--glow-primary), 0 0 8px var(--glow-primary), 0 0 12px var(--glow-primary); font-family: var(--font-title); } .container .lemonade-text { color: var(--secondary-accent); text-shadow: 0 0 8px var(--glow-secondary); } .container .title-subtitle { padding-left: 0; margin-top: 15px; } .container .subtitle-text { color: var(--text-muted); font-size: 1.2rem; font-family: var(--font-body); font-style: italic; font-weight: 400; letter-spacing: 2px; text-transform: uppercase; opacity: 0.8; } .container img { max-width: 100%; border: 2px solid var(--border-color); margin-bottom: 40px; box-shadow: 0 5px 15px rgba(0,0,0,0.5); 
border-radius: 4px; } .container .section-container { margin-bottom: 25px; padding-bottom: 25px; border-bottom: 1px dashed var(--border-color); } .container .section-container:last-of-type { border-bottom: none; padding-bottom: 0; margin-bottom: 0; } .container .section-header { display: flex; align-items: center; padding: 0 0 15px 0; } .container .section-title { font-family: var(--font-title); background: linear-gradient(45deg, var(--secondary-accent), var(--primary-accent)); background-clip: text; -webkit-background-clip: text; -webkit-text-fill-color: transparent; font-size: 1.4rem; margin: 0 !important; padding: 0 0 10px 0 !important; letter-spacing: 1px; font-weight: 700; text-transform: uppercase; border: none !important; position: relative; display: inline-block; } .container .section-title::after { content: ''; position: absolute; bottom: 0; left: 0; width: 100%; height: 2px; background-image: linear-gradient(to right, var(--secondary-accent), var(--primary-accent)); box-shadow: 0 0 6px var(--glow-secondary), 0 0 6px var(--glow-primary); border-radius: 2px; } .container .section-content { padding: 20px 0 0 0; } .container .subheading { color: var(--secondary-accent); font-size: 1.1rem; margin-top: 20px; margin-bottom: 12px; font-weight: 700; display: block; text-transform: uppercase; letter-spacing: 2px; font-family: var(--font-title); border-bottom: 1px solid var(--secondary-accent); padding-bottom: 6px; text-shadow: 0 0 4px var(--glow-secondary); } .container .data-box { background-color: var(--bg-card); padding: 15px; border: 1px solid var(--border-color); border-left: 2px solid var(--primary-accent); margin-bottom: 15px; box-shadow: inset 0 0 6px rgba(0,0,0,0.4); border-radius: 4px; font-size: 1rem; } .container .data-row { display: flex; align-items: center; margin-bottom: 6px; padding: 5px 0; } .container .data-row:last-child { margin-bottom: 0; } .container .data-arrow { color: var(--secondary-accent); font-weight: bold; margin-right: 10px; 
font-family: var(--font-code); font-size: 1rem; } .container .data-label { color: var(--white); font-weight: 600; font-family: var(--font-body); margin-right: 8px; min-width: 80px; } .container a { color: var(--primary-accent); text-decoration: none; font-weight: 600; transition: all .2s; } .container .data-row a { border-bottom: 1px dotted var(--primary-accent); } .container a:hover { text-decoration: none; color: var(--white); text-shadow: 0 0 5px var(--glow-primary); } .container .data-row a:hover { border-bottom-style: solid; } .container .dropdown-container { margin-top: 20px; } .container .dropdown-summary { cursor: pointer; padding: 10px 0; color: var(--text-muted); font-size: 1.1rem; font-weight: 700; text-transform: none; font-family: var(--font-title); letter-spacing: 1px; list-style: none; transition: color 0.2s ease; } .container .dropdown-summary:hover { color: var(--primary-accent); } .container .dropdown-arrow { color: var(--secondary-accent); margin-right: 10px; transition: transform 0.2s ease; } .container .dropdown-content { margin-top: 15px; padding: 20px; background-color: var(--bg-card); border: 1px solid var(--border-color); border-radius: 4px; } .container .config-title { color: var(--text-muted); font-size: 1rem; margin-bottom: 10px; font-family: var(--font-body); text-transform: uppercase; letter-spacing: 1px; font-weight: 700; } .container pre { background-color: #1c1c1c; padding: 15px; border: 1px solid var(--border-color); white-space: pre-wrap; word-wrap: break-word; color: #c5c8c6; border-radius: 4px; box-shadow: inset 0 0 5px rgba(0,0,0,0.5); } .container pre code { background: none; color: inherit; padding: 0; border-radius: 0; } .container code { font-family: var(--font-code); color: var(--primary-accent); background: var(--border-color); padding: 2px 5px; border-radius: 4px; } No layer left behind edition. Upscale redone with the missing final layer included. 
The original upscales were always missing a layer, but I never troubleshooted to identify what layer was missing. Turns out it was the final layer. That's kind of an important one. This model is an uncensored, creative writing and RP model. Compared to the older version, it is smarter and I think has a bit less repetition. The old V2 version though is slightly more creative due to the instability it had. Creation Process: Upscale > CPT > SFT > DPO Pretrained on approx 300MB of light novel and FineWeb-2 corpus. SFT on approx 8 million tokens, SFW / NSFW RP, stories and creative instruct data. DPO on a high quality RP / NSFW dataset with a focus on improving instruction following, reducing repetition and fixing common model mistakes. Merge configurations used during the model creation process. Upscale (Passthrough) basemodel: ConicCat/Mistral-Small-3.2-AntiRep-24B mergemethod: passthrough dtype: bfloat16 slices: - sources: - model: ConicCat/Mistral-Small-3.2-AntiRep-24B layerrange: [0, 29] - sources: - model: ConicCat/Mistral-Small-3.2-AntiRep-24B layerrange: [10, 40] Not optimized for cost / performance efficiency, YMMV. 
Pretrain (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ../mergekit/pfv3upscale
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/pretraindatasetv5stripped.jsonl
    type: completion
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 32
lora_alpha: 64
lora_dropout: 0.05
lora_target_linear: true
# lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 4e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 12288
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 40
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1
logging_steps: 2
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-PT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1
```

SFT (4x H100)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/dataset.jsonl
    type: chat_template
    split: train
    chat_template_strategy: tokenizer
    field_messages: messages
    message_property_mappings:
      role: role
      content: content
    roles:
      user: ["user"]
      assistant: ["assistant"]
      system: ["system"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# QLORA CONFIGURATION
# ====================
adapter: qlora
load_in_4bit: true
lora_r: 128
lora_alpha: 128
lora_dropout: 0.1
lora_target_linear: true
lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 3
micro_batch_size: 4
gradient_accumulation_steps: 1
learning_rate: 1e-5
optimizer: paged_adamw_8bit
lr_scheduler: rex
warmup_ratio: 0.05
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE & PACKING
# ====================
sequence_len: 8192
sample_packing: true
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
flash_attention: true
gradient_checkpointing: offload
deepspeed: deepspeed_configs/zero1.json
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this

# ====================
# EVALUATION & CHECKPOINTING
# ====================
save_strategy: steps
save_steps: 20
save_total_limit: 5  # Keep best + last few checkpoints
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-SFT
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2
```

DPO (2x H200)

```yaml
# ====================
# MODEL CONFIGURATION
# ====================
base_model: ./Visage-V3-PT-1-SFT-2/merged
model_type: MistralForCausalLM
tokenizer_type: AutoTokenizer
chat_template: mistral_v7_tekken

# ====================
# RL/DPO CONFIGURATION
# ====================
rl: dpo
rl_beta: 0.085

# ====================
# DATASET CONFIGURATION
# ====================
datasets:
  - path: ./data/handcrafteddatasetmistralrep.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
  - path: ./data/approvedautomatedl3dataset.jsonl
    type: chat_template.default
    field_messages: messages
    field_chosen: chosen
    field_rejected: rejected
    message_property_mappings:
      role: role
      content: content
    roles:
      system: ["system"]
      user: ["user"]
      assistant: ["assistant"]
dataset_prepared_path:
train_on_inputs: false  # Only train on assistant responses

# ====================
# LORA CONFIGURATION
# ====================
adapter: lora
load_in_8bit: true
lora_r: 16
lora_alpha: 32
lora_dropout: 0.1
lora_target_linear: true
lora_modules_to_save:  # Uncomment only if you added NEW tokens

# ====================
# TRAINING PARAMETERS
# ====================
num_epochs: 1
micro_batch_size: 2
gradient_accumulation_steps: 4
learning_rate: 2e-6
optimizer: adamw_torch_fused
lr_scheduler: cosine
warmup_steps: 5
weight_decay: 0.01
max_grad_norm: 1.0

# ====================
# SEQUENCE CONFIGURATION
# ====================
sequence_len: 8192
pad_to_sequence_len: true

# ====================
# HARDWARE OPTIMIZATIONS
# ====================
bf16: auto
tf32: false
flash_attention: true
gradient_checkpointing: offload
plugins:
  - axolotl.integrations.liger.LigerPlugin
  - axolotl.integrations.cut_cross_entropy.CutCrossEntropyPlugin
cut_cross_entropy: true
liger_rope: true
liger_rms_norm: true
liger_layer_norm: true
liger_glu_activation: true
liger_cross_entropy: false  # Cut Cross Entropy overrides this
liger_fused_linear_cross_entropy: false  # Cut Cross Entropy overrides this
deepspeed: deepspeed_configs/zero1.json

# ====================
# CHECKPOINTING
# ====================
save_steps: 10
save_total_limit: 10
load_best_model_at_end: true
metric_for_best_model: eval_loss
greater_is_better: false

# ====================
# LOGGING & OUTPUT
# ====================
output_dir: ./Visage-V3-PT-1-SFT-2-DPO-2
logging_steps: 1
save_safetensors: true

# ====================
# WANDB TRACKING
# ====================
wandb_project: Visage-V3-DPO
wandb_entity: yourentity
wandb_name: Visage-V3-PT-1-SFT-2-DPO-2
```
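One detail worth noting across the three configs: despite the different GPU counts in the stage headings (4x H100, 4x H100, 2x H200), the effective global batch size, micro_batch_size × gradient_accumulation_steps × number of GPUs, works out the same at every stage. A quick sanity check (GPU counts are taken from the headings, not from the configs themselves):

```python
# Effective global batch size per training stage:
# micro_batch_size * gradient_accumulation_steps * num_gpus
stages = {
    "pretrain": {"micro_batch_size": 4, "gradient_accumulation_steps": 1, "num_gpus": 4},
    "sft":      {"micro_batch_size": 4, "gradient_accumulation_steps": 1, "num_gpus": 4},
    "dpo":      {"micro_batch_size": 2, "gradient_accumulation_steps": 4, "num_gpus": 2},
}

for name, cfg in stages.items():
    global_bs = (cfg["micro_batch_size"]
                 * cfg["gradient_accumulation_steps"]
                 * cfg["num_gpus"])
    print(f"{name}: global batch size = {global_bs}")
# All three stages land on a global batch size of 16.
```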


L3.3-GeneticLemonade-Final-70B-6bpw-h8-exl2


L3.3-Genetic-Lemonade-Sunset-70B


L3.3-GeneticLemonade-Unleashed-v2-70B-4.5bpw-hb6-exl2


L3.3-GeneticLemonade-Unleashed-v2.1-70B-4bpw-hb6-exl2

An experimental release. A QLoRA finetune of zerofata/GeneticLemonade-Unleashed trained on a test dataset. Performance is improved over the original in my testing, but there are likely areas where the model will underperform, and I am looking for feedback on those.

This is a creative model intended to excel at character-driven RP / ERP. It has not been tested or trained on adventure stories or any large amounts of creative writing.

Recommended samplers: play with these; they are not the 'best' settings, just a stable baseline. Use the Llama-3-Instruct-Names template, but you will need to uncheck "System same as user".

The model was trained on a tiny synthetic dataset of 640k tokens, approximately 190 conversations. Data was generated by script and then manually reviewed / edited. The dataset is approximately 60% SFW and 40% NSFW, split as 90% multi-turn RP conversations, 5% creative writing and 5% miscellaneous.
It is an experiment to see how models perform when provided with small amounts of high quality synthetic data, as opposed to human data.
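For a sense of scale, the figures quoted above work out to roughly 3.4k tokens per conversation. A quick check (numbers taken from the card; applying the percentage split to conversation counts is an approximation):

```python
# Dataset scale from the figures quoted above.
total_tokens = 640_000
conversations = 190

avg_tokens_per_conversation = total_tokens / conversations
print(f"~{avg_tokens_per_conversation:.0f} tokens per conversation")  # ~3368

# Approximate composition by conversation count (90/5/5 split).
composition = {"multi-turn RP": 0.90, "creative writing": 0.05, "misc": 0.05}
for kind, share in composition.items():
    print(f"{kind}: ~{share * conversations:.0f} conversations")
```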


L3.3-GeneticLemonade-Unleashed-v3-70B_4.5bpw-hb6-exl2

An experimental release. An SFT+DPO QLoRA finetune of zerofata/GeneticLemonade-Unleashed.

This is a creative model intended to excel at character-driven RP / ERP. It has not been tested or trained on adventure stories or any large amounts of creative writing. It is designed to provide longer, narrative-heavy responses where characters are portrayed accurately and proactively.

Recommended samplers: play with these; they are not the 'best' settings, just a stable baseline. Something interesting to note: this model supports higher temps than would normally be recommended for other L3 models. Use the Llama-3-Instruct-Names template, but you will need to uncheck "System same as user".

The model first went through SFT on a small synthetic dataset of 2.9 million tokens, approximately 750 conversations: primarily RP data, with small amounts of random instruct / assistant data and creative writing.
The model then went through DPO training using approximately 1,100 chosen examples from the SFT dataset that were of exceptional quality or showed verifiable instruction following. Rejected samples were generated using another Llama 3.3 finetune known for poor instruction following.

Axolotl configs: neither is optimized for cost / performance efficiency, YMMV.

SFT (1x H200)
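The DPO preference data described above pairs a shared conversation prefix with a chosen and a rejected assistant reply. A hypothetical jsonl record illustrating that shape (the example content is invented; only the messages / chosen / rejected layout is implied by the description):

```python
import json

# Hypothetical DPO preference record; only the messages / chosen / rejected
# layout is taken from the description above, the content is invented.
record = {
    "messages": [  # shared conversation prefix
        {"role": "system", "content": "You are roleplaying as the character Mira."},
        {"role": "user", "content": "Mira glances at the storm outside. What does she do?"},
    ],
    "chosen": {
        "role": "assistant",
        "content": "Mira presses a palm to the cold glass, watching the rain...",
    },
    "rejected": {
        "role": "assistant",
        "content": "As an AI language model, I can't watch storms.",
    },
}

# Each line of the .jsonl training file is one such record.
print(json.dumps(record)[:72])
```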


L3.3-GeneticLemonade-Unleashed-v3-70B_6bpw-hb8-exl2



L3.3-GeneticLemonade-Final-v2-70B_4.5bpw-hb6-exl2


mithril-llama-70b-exl3-4.25bpw


L3.3-GeneticLemonade-Unleashed-v2.1-70B



Llama-3.3-70B-Vulpecula-r1-4.5bpw-hb6-exl2


L3.3-GeneticLemonade-Unleashed-v2-70B
