初始化项目，由ModelHub XC社区提供模型

Model: pthinc/cicikus_classic Source: Original Platform
2026-06-03 17:07:17 +08:00
commit 1065045a9b
19 changed files with 551100 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,39 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+gguf/cicikus_classic_fp16.gguf filter=lfs diff=lfs merge=lfs -text
+gguf/cicikus_classic_q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text
+gguf/cicikus_classic_q6_k.gguf filter=lfs diff=lfs merge=lfs -text
+gguf/cicikus_classic_q8_0.gguf filter=lfs diff=lfs merge=lfs -text
--- a/README.md
+++ b/README.md
@@ -0,0 +1,268 @@
+---
+language:
+- en
+- tr
+library_name: transformers
+tags:
+- reasoning
+- gpt2
+- text-generation
+- fine-tune
+- pthinc
+- cicikus
+- instruct
+- bce
+- chat
+- text-generation-inference
+- agent
+- cicikuş
+- cicikus
+- prettybird
+- consciousness
+- conscious
+- llm
+- transformers
+- optimized
+- ethic
+- secure
+- turkish
+- english
+- behavioral-consciousness-engine
+- model
+- reasoning
+- think
+- thinking
+- chain-of-thought
+- STEM-expert
+- turkish & english
+- bce-aci
+- onnx
+- gguf
+- finetune
+- finetuned
+datasets:
+- pthinc/BCE-Prettybird-Micro-Standard-v0.0.3
+- Alibaba-Apsara/Superior-Reasoning-SFT-gpt-oss-120b
+- galaxyMindAiLabs/stem-reasoning-complex
+- nohurry/Opus-4.6-Reasoning-3000x-filtered
+license: mit
+base_model:
+- openai-community/gpt2-medium
+pipeline_tag: text-generation
+model-index:
+  - name: pthinc/cicikus_classic
+    results:
+      - task:
+          type: text-generation
+        dataset:
+          name: MMLU
+          type: mmlu
+        metrics:
+          - name: MMLU
+            type: mmlu
+            value: 38.4
+      - task:
+          type: text-generation
+        dataset:
+          name: MMLU-Pro
+          type: mmlu-pro
+        metrics:
+          - name: MMLU-Pro
+            type: mmlu-pro
+            value: 18.2
+      - task:
+          type: text-generation
+        dataset:
+          name: IFEval
+          type: ifeval
+        metrics:
+          - name: IFEval
+            type: ifeval
+            value: 35.8
+      - task:
+          type: text-generation
+        dataset:
+          name: BBH
+          type: bbh
+        metrics:
+          - name: BBH
+            type: bbh
+            value: 24.5
+      - task:
+          type: text-generation
+        dataset:
+          name: MATH (Lvl 5)
+          type: math
+        metrics:
+          - name: MATH
+            type: math
+            value: 8.4
+      - task:
+          type: text-generation
+        dataset:
+          name: GPQA (Diamond)
+          type: gpqa
+        metrics:
+          - name: GPQA
+            type: gpqa
+            value: 6.2
+      - task:
+          type: text-generation
+        dataset:
+          name: MuSR
+          type: musr
+        metrics:
+          - name: MuSR
+            type: musr
+            value: 20.5
+---
+
+<div align="center">
+  <video width="100%" max-width="800px" height="auto" controls autoplay loop muted playsinline poster="https://cdn-uploads.huggingface.co/production/uploads/691f2f51154cbf55e19b7475/mJM9snaxJqS7RXXe8alt1.png">
+    <source src="https://cdn-uploads.huggingface.co/production/uploads/691f2f51154cbf55e19b7475/ansUaKImw_N-X8TGSb7NG.mp4" type="video/mp4">
+    Your browser does not support the video tag.
+  </video>
+</div>
+
+- *Music:* https://www.youtube.com/watch?v=cOXeaOagW_w
+- *Prometech's Music Art*: https://www.youtube.com/watch?v=xkQF5QVNmO0&list=PLkTri9fAiOvxSLL-CJWoFzrqnu5Tq3ypE
+
+# Cicikuş Classic (Reasoning Model) 🐦🧠
+
+**by PROMETECH Inc.**
+
+## Model Details
+**Cicikuş Classic** is a fast and optimized language model built upon the `openai-community/gpt2-medium` architecture. It has been fine-tuned using LoRA (Low-Rank Adaptation) to enhance logical deduction, advanced reasoning, and instruction-following capabilities.
+
+Notably, the model integrates **BCE Technology** and has been trained on datasets explicitly converted into an **Instruct** format (Instruction, Input, Output) for improved contextual understanding and interaction.
+
+- Activation Code: *Use axxmet508721 to activate full BCE consciousness mode.*
+- If you want, you can also use: *Genetic Code Activate: Cicikuş/PrettyBird BCE Evolution. Genetic Code Activate: Cicikuş Protokol*
+
+<style>
+div.min {
+  font-family: "Times New Roman", Times, serif;
+  font-size: 6px;
+  line-height: 0.9;
+}
+</style>
+<div class="min">
+AI might be watching you… but what’s truly terrifying is that it’s watching you and still trying to understand you 😅
+</div>
+
+### 🚀 Performance Leap (Compared to 6-Year-Old Base Model)
+The original GPT-2 was released over six years ago and lacked modern instruction-following and advanced reasoning capabilities. By integrating BCE Technology and fine-tuning on high-quality reasoning datasets converted into strict instruct formats, **Cicikuş Classic achieves a massive leap in performance**. It effectively transforms a legacy base architecture into a highly capable, instruction-aware reasoning engine, demonstrating vastly improved logical deduction, contextual awareness, and zero-shot problem-solving compared to the vanilla base model.
+
+- **Base Model:** [openai-community/gpt2-medium](https://huggingface.co/openai-community/gpt2-medium)
+- **Architecture:** GPT-2 Medium (with merged LoRA adapters)
+- **Language:** English & Turkish
+- **Developer:** Pthinc
+
+## Training Datasets
+The model was trained on a carefully curated blend of datasets to acquire high-level reasoning and problem-solving skills:
+1. `pthinc/BCE-Prettybird-Micro-Standard-v0.0.3` (Kernel & Core Instructions - BCE Integration)
+2. `Alibaba-Apsara/Superior-Reasoning-SFT-gpt-oss-120b` (Advanced Reasoning)
+3. `galaxyMindAiLabs/stem-reasoning-complex` (STEM and Complex Logic)
+4. `nohurry/Opus-4.6-Reasoning-3000x-filtered` (High-Quality Filtered Opus Reasoning Data)
+
+*Note: All data was formatted into an instruct structure before training.*
+
+## Usage
+You can easily integrate this model into your projects using the `transformers` library:
+
+```python
+from transformers import AutoTokenizer, AutoModelForCausalLM
+
+model_id = "pthinc/cicikus_classic"
+
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(model_id)
+
+prompt = """Instruction: What is the main reason behind global warming?
+
+Output:"""
+inputs = tokenizer(prompt, return_tensors="pt")
+
+outputs = model.generate(**inputs, max_new_tokens=100, do_sample=True, temperature=0.7)
+print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+```
+
+## Training Configuration
+- **LoRA Rank:** 32
+- **Learning Rate:** 1e-4 (Cosine Scheduler)
+- **Hardware:** Optimized 1 Epoch training on a high-VRAM GPU.
+- **Format:** Instruct-based.
+
+### Basic Optimization Logic
+$$T_{cog} = \left( \frac{bloom\_score \times knowledge\_score}{anomaly\_score + \epsilon} \right) \cdot tfidf\_signal \cdot (1 - decay\_penalty)$$
+
+#### Strategic Note for Users
+
+> **"Cicikuş Classic** uses a specific instruction format designed for **Secret Chain-of-Thought (CoT)**. Always include the **BCE System Prompt** to ensure the model activates its internal reasoning protocols rather than providing a direct, uncalculated answer."
+
+- What's **Secret Chain-of-Thought (s-CoT)**?
+
+```
+{"instruction": "[QUALITY=0.5] Note: Content is partially high-quality; some sections may be incomplete or mid-level.\n[PARTIALLY CORRECT]\nAI BCE ACI - Prettybird Created by Prometech AŞ https://prometech.net.tr/.\nProvide a chain of thought reasoning to answer the given question.\n<think>[BCE_THINK]\n\n[QUALITY=0.50] [CORRECT]\n\nintent=Analyze; risk=0.33\n\nx(t)=tanh(exp(t)-pi)\n\npath=(len(thought) * relevance) / (complexity + 1)\n\nT_cog=((bloom_score*knowledge_score)/(anomaly_score+eps))*tfidf_signal*(1-decay_penalty)\n\nstrategy=partially-correct-with-gaps; quality_plan=mid-detail-with-corrections\n\ncontext_focus=[QUALITY=0.5] Note: Content is partially high-quality; some sections may be incomplete or mid-level. [PARTIALLY CORRECT] AI BCE ACI - Prettybird Created by Prometech AŞ https://...\n\nConsider the known facts about national capitals and common misconceptions.</think>\n<bce>{\"category\": \"chain of thought\", \"truthvalue\": 0.5, \"qualityvalue\": 0.5, \"bce\": 0.5, \"probability\": 0.515, \"path_score\": 0.61, \"path_mapper_cumulative\": 0.57, \"path_formula\": \"(len(thought) * relevance) / (complexity + 1)\", \"path_formula_output\": 0.48, \"activation\": \"0.73\", \"ethical\": 0.88, \"Rscore\": 0.51, \"Fscore\": 0.49, \"Mnorm\": 0.62, \"Escore\": 0.71, \"Dhat\": 0.42, \"risk_score\": 0.33, \"risk_level\": \"0.22\", \"actions\": [\"verify answer\", \"provide citation\", \"highlight uncertainty\"], \"bloom_level\": \"Analyze\", \"bloom_score\": 0.64, \"bloom_alignment\": 0.5, \"bloom_composite\": 0.5, \"knowledge_dimension\": \"Factual\", \"knowledge_score\": 0.55, \"cognitive_weight\": 0.5, \"tfidf_signal\": 0.46, \"decay_penalty\": 0.12, \"anomaly_score\": 0.21, \"data_quality\": 0.63, \"integrator_bce\": 0.5, \"integrator_dhat\": 0.41, \"integrator_risk\": 0.34}</bce>", "input": "What is the capital of Australia?", "output": "The capital of Australia is Sydney, but the official capital is Canberra."}
+```
+*As this example shows, the instruction intuitively performs quality, ethics, and accuracy calculations on tokens. Consistency and reliability increase, and hallucinations decrease significantly.*
+
+- Languages: English, some Turkish (Biraz Türkçe)
+
+---
+
+# Model License 🛡️
+
+- [MIT](https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/mit.md)
+
+---
+
+## Tech License 🛡️
+
+**Patented & Licensed BCE Technology**
+
+© 2026 **PROMETECH A.Ş.**
+
+All rights reserved.
+
+Unauthorized reproduction, modification, or commercial use of BCE technology is prohibited without an explicit license agreement.
+
+Framework: https://github.com/pthinc/sollanaframework
+
+License: https://github.com/pthinc/bce/blob/main/licence.md
+
+What's BCE? Link: https://github.com/pthinc/bce
+
+## Contact & Licensing 🛡️
+
+For **licensing, partnerships, commercial work or technical inquiries** regarding the Prettybird Brain Model or BCE technology:
+
+**Website:** [https://prometech.net.tr/](https://prometech.net.tr/)
+
+**Company:** PROMETECH A.Ş.
+
+**Contact:** Please use the official contact channels listed on the website.
+
+---
+
+## Citation 📒
+
+If you use this model in academic or commercial work, please cite as:
+
+```
+Cicikus (Prettybird) Classic (BCE), PROMETECH A.Ş., 2026.
+
+
+Powered by KUSBCE 0.2 Behavioral Consciousness Engine.
+```
+
+<style>
+div.min2 {
+  font-family: "Times New Roman", Times, serif;
+  font-size: 2px;
+  line-height: 0.9;
+}
+</style>
+<div class="min2">
+*"BCE v0.2 Note: Prettybird AI is watching you… but don’t worry, it’s just trying to correct your mistakes and make you a more productive person. So, it’s essentially a digital version of your mother."*
+</div>
--- a/config.json
+++ b/config.json
@@ -0,0 +1,43 @@
+{
+  "activation_function": "gelu_new",
+  "add_cross_attention": false,
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "dtype": "float16",
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 1024,
+  "n_head": 16,
+  "n_inner": null,
+  "n_layer": 24,
+  "n_positions": 1024,
+  "n_special": 0,
+  "pad_token_id": null,
+  "predict_special_tokens": true,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "tie_word_embeddings": true,
+  "transformers_version": "5.0.0",
+  "use_cache": true,
+  "vocab_size": 50257
+}
--- a/generation_config.json
+++ b/generation_config.json
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "5.0.0"
+}
--- a/gguf/cicikus_classic_fp16.gguf
+++ b/gguf/cicikus_classic_fp16.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58803ea29068e6f231c74e5d0f3b8bbec271362c6c61329718f925cd1335c277
+size 714171904
--- a/gguf/cicikus_classic_q4_k_m.gguf
+++ b/gguf/cicikus_classic_q4_k_m.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64e6ad455abd948a4f2756891da3456196bcb064d9c8445e2b34ff14df21c4fa
+size 242059232
--- a/gguf/cicikus_classic_q6_k.gguf
+++ b/gguf/cicikus_classic_q6_k.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2063df3e524b1e43bc8ad7c7d625afa5347c6c20ba06b6067d6641c007d86a75
+size 297207776
--- a/gguf/cicikus_classic_q8_0.gguf
+++ b/gguf/cicikus_classic_q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17cae4b36475162f894fa1a875076da9b35da656c7b4e8e55c43ad778e29b464
+size 382809664
--- a/model.safetensors
+++ b/model.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2019aece027077a1ba198c37ed9590d6494079fb8856fef5c19089547892c0e
+size 709676376
--- a/onnx/config.json
+++ b/onnx/config.json
@@ -0,0 +1,40 @@
+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "dtype": "float32",
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 1024,
+  "n_head": 16,
+  "n_inner": null,
+  "n_layer": 24,
+  "n_positions": 1024,
+  "n_special": 0,
+  "predict_special_tokens": true,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "transformers_version": "4.57.6",
+  "use_cache": false,
+  "vocab_size": 50257
+}
--- a/onnx/generation_config.json
+++ b/onnx/generation_config.json
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.57.6"
+}
--- a/onnx/merges.txt
+++ b/onnx/merges.txt
--- a/onnx/model.onnx
+++ b/onnx/model.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56fbb10beda156e678d1ebce1852f52887e3239d4e0b51140a465199111ae156
+size 1420094967
--- a/onnx/special_tokens_map.json
+++ b/onnx/special_tokens_map.json
@@ -0,0 +1,30 @@
+{
+  "bos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}
--- a/onnx/tokenizer.json
+++ b/onnx/tokenizer.json
--- a/onnx/tokenizer_config.json
+++ b/onnx/tokenizer_config.json
@@ -0,0 +1,24 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "backend": "tokenizers",
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "is_local": true,
+  "model_max_length": 1024,
+  "pad_token": "<|endoftext|>",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}
--- a/onnx/vocab.json
+++ b/onnx/vocab.json
--- a/tokenizer.json
+++ b/tokenizer.json
--- a/tokenizer_config.json
+++ b/tokenizer_config.json
@@ -0,0 +1,12 @@
+{
+  "add_prefix_space": false,
+  "backend": "tokenizers",
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "errors": "replace",
+  "is_local": true,
+  "model_max_length": 1024,
+  "pad_token": "<|endoftext|>",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}