├── .github └── workflows │ ├── deploy-playground.yaml │ ├── quality-gate-playground.yaml │ └── template-docker.yaml ├── .gitignore ├── README.md ├── alphamaze.gif ├── api ├── api_tokens.yml ├── config.yml ├── convert.sh └── vllm_host.sh ├── benchmark ├── README.md ├── evaluator.py ├── main.py ├── models │ ├── __init__.py │ ├── base.py │ ├── hf_model.py │ ├── instruction_type.py │ ├── openai_api.py │ └── vllm_model.py ├── requirements.txt ├── run.sh └── utils.py ├── grpo_progress.png ├── inference.py ├── open_vocab.py ├── playground ├── .dockerignore ├── .gitignore ├── Dockerfile ├── README.md ├── components.json ├── eslint.config.mjs ├── maze_reasoning.jsonl ├── next.config.ts ├── package-lock.json ├── package.json ├── postcss.config.mjs ├── public │ ├── file.svg │ ├── globe.svg │ ├── next.svg │ ├── vercel.svg │ └── window.svg ├── src │ ├── app │ │ ├── _components │ │ │ └── MazeSolver.tsx │ │ ├── api │ │ │ └── chat │ │ │ │ └── route.ts │ │ ├── favicon.ico │ │ ├── globals.css │ │ ├── layout.tsx │ │ └── page.tsx │ ├── components │ │ └── ui │ │ │ ├── button.tsx │ │ │ ├── card.tsx │ │ │ ├── tabs.tsx │ │ │ └── textarea.tsx │ └── lib │ │ └── utils.ts ├── tailwind.config.ts └── tsconfig.json ├── synthetic_maze.py ├── synthetic_maze_token.py ├── synthetic_reset_maze.py ├── training ├── Llama-factory-config │ ├── Qwen2.5_1.5B_distil.yaml │ ├── dataset_info.json │ └── qwen2_5_7B_R1_full_sft.yaml ├── grpo_stage.py ├── grpo_train.sh ├── load_push.py └── requirements.txt └── utils.py /.github/workflows/deploy-playground.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/.github/workflows/deploy-playground.yaml -------------------------------------------------------------------------------- /.github/workflows/quality-gate-playground.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/.github/workflows/quality-gate-playground.yaml -------------------------------------------------------------------------------- /.github/workflows/template-docker.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/.github/workflows/template-docker.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/README.md -------------------------------------------------------------------------------- /alphamaze.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/alphamaze.gif -------------------------------------------------------------------------------- /api/api_tokens.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/api/api_tokens.yml -------------------------------------------------------------------------------- /api/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/api/config.yml -------------------------------------------------------------------------------- /api/convert.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/api/convert.sh -------------------------------------------------------------------------------- /api/vllm_host.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/api/vllm_host.sh -------------------------------------------------------------------------------- /benchmark/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/README.md -------------------------------------------------------------------------------- /benchmark/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/evaluator.py -------------------------------------------------------------------------------- /benchmark/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/main.py -------------------------------------------------------------------------------- /benchmark/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /benchmark/models/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/models/base.py -------------------------------------------------------------------------------- /benchmark/models/hf_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/models/hf_model.py -------------------------------------------------------------------------------- /benchmark/models/instruction_type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/models/instruction_type.py -------------------------------------------------------------------------------- /benchmark/models/openai_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/models/openai_api.py -------------------------------------------------------------------------------- /benchmark/models/vllm_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/models/vllm_model.py -------------------------------------------------------------------------------- /benchmark/requirements.txt: -------------------------------------------------------------------------------- 1 | vllm 2 | openai 3 | transformers 4 | torch 5 | datasets -------------------------------------------------------------------------------- /benchmark/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/run.sh -------------------------------------------------------------------------------- /benchmark/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/benchmark/utils.py -------------------------------------------------------------------------------- /grpo_progress.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/grpo_progress.png -------------------------------------------------------------------------------- /inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/inference.py -------------------------------------------------------------------------------- /open_vocab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/open_vocab.py -------------------------------------------------------------------------------- /playground/.dockerignore: -------------------------------------------------------------------------------- 1 | node_modules 2 | .next 3 | package-lock.json 4 | -------------------------------------------------------------------------------- /playground/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/.gitignore -------------------------------------------------------------------------------- /playground/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/Dockerfile -------------------------------------------------------------------------------- /playground/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/README.md -------------------------------------------------------------------------------- /playground/components.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/components.json -------------------------------------------------------------------------------- /playground/eslint.config.mjs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/eslint.config.mjs -------------------------------------------------------------------------------- /playground/maze_reasoning.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/maze_reasoning.jsonl -------------------------------------------------------------------------------- /playground/next.config.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/next.config.ts -------------------------------------------------------------------------------- /playground/package-lock.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/package-lock.json -------------------------------------------------------------------------------- /playground/package.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/package.json -------------------------------------------------------------------------------- /playground/postcss.config.mjs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/postcss.config.mjs -------------------------------------------------------------------------------- /playground/public/file.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/public/file.svg -------------------------------------------------------------------------------- /playground/public/globe.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/public/globe.svg -------------------------------------------------------------------------------- /playground/public/next.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/public/next.svg -------------------------------------------------------------------------------- /playground/public/vercel.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/public/vercel.svg -------------------------------------------------------------------------------- /playground/public/window.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/public/window.svg -------------------------------------------------------------------------------- /playground/src/app/_components/MazeSolver.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/_components/MazeSolver.tsx -------------------------------------------------------------------------------- /playground/src/app/api/chat/route.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/api/chat/route.ts -------------------------------------------------------------------------------- /playground/src/app/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/favicon.ico -------------------------------------------------------------------------------- /playground/src/app/globals.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/globals.css -------------------------------------------------------------------------------- /playground/src/app/layout.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/layout.tsx -------------------------------------------------------------------------------- /playground/src/app/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/app/page.tsx -------------------------------------------------------------------------------- /playground/src/components/ui/button.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/components/ui/button.tsx -------------------------------------------------------------------------------- /playground/src/components/ui/card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/components/ui/card.tsx -------------------------------------------------------------------------------- /playground/src/components/ui/tabs.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/components/ui/tabs.tsx -------------------------------------------------------------------------------- /playground/src/components/ui/textarea.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/components/ui/textarea.tsx -------------------------------------------------------------------------------- /playground/src/lib/utils.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/src/lib/utils.ts -------------------------------------------------------------------------------- /playground/tailwind.config.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/tailwind.config.ts -------------------------------------------------------------------------------- /playground/tsconfig.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/playground/tsconfig.json -------------------------------------------------------------------------------- /synthetic_maze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/synthetic_maze.py -------------------------------------------------------------------------------- /synthetic_maze_token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/synthetic_maze_token.py -------------------------------------------------------------------------------- /synthetic_reset_maze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/synthetic_reset_maze.py -------------------------------------------------------------------------------- /training/Llama-factory-config/Qwen2.5_1.5B_distil.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/Llama-factory-config/Qwen2.5_1.5B_distil.yaml -------------------------------------------------------------------------------- /training/Llama-factory-config/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/Llama-factory-config/dataset_info.json -------------------------------------------------------------------------------- /training/Llama-factory-config/qwen2_5_7B_R1_full_sft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/Llama-factory-config/qwen2_5_7B_R1_full_sft.yaml -------------------------------------------------------------------------------- /training/grpo_stage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/grpo_stage.py -------------------------------------------------------------------------------- /training/grpo_train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/grpo_train.sh -------------------------------------------------------------------------------- /training/load_push.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/training/load_push.py -------------------------------------------------------------------------------- /training/requirements.txt: -------------------------------------------------------------------------------- 1 | unsloth 2 | vllm 3 | tensorboard 4 | -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/janhq/visual-thinker/HEAD/utils.py --------------------------------------------------------------------------------