├── .dockerignore ├── .eslintignore ├── .eslintrc ├── .gitignore ├── .npmrc ├── Cargo.lock ├── Cargo.toml ├── Cross.toml ├── LICENSE ├── README.md ├── docs ├── DEPLOY_INSTANCE.md ├── DEPLOY_WORKER.md └── DEVELOPER.md ├── img_hash ├── Cargo.toml ├── LICENSE-APACHE ├── LICENSE-MIT └── src │ ├── alg │ ├── blockhash.rs │ └── mod.rs │ ├── bin │ └── hash_image.rs │ ├── dct.rs │ ├── fr.rs │ ├── lib.rs │ └── traits.rs ├── migrations ├── 0000_init.sql ├── 0001_source_size.sql └── 0002_source_size_trigger.sql ├── package.json ├── pnpm-lock.yaml ├── pnpm-workspace.yaml ├── proto-rs ├── Cargo.toml ├── build.rs └── src │ └── lib.rs ├── proto └── gateway.mit.proto ├── rust-toolchain.toml ├── rustfmt.toml ├── services ├── inpainting_lama_v1 │ ├── inpainting.py │ ├── main.py │ └── models.py ├── mask_refinement_v1 │ ├── main.py │ ├── models.py │ ├── text_mask_utils.py │ └── utils.py ├── models │ ├── Cargo.lock │ ├── Cargo.toml │ └── src │ │ └── lib.rs ├── ocr_ctc_v1 │ ├── alphabet-all-v5.txt │ ├── main.py │ ├── models.py │ ├── ocr.py │ └── utils.py ├── phash │ ├── Cargo.lock │ ├── Cargo.toml │ └── src │ │ └── main.rs ├── text_detection_v1 │ ├── craft_utils.py │ ├── dbnet_utils.py │ ├── detector.py │ ├── main.py │ ├── models.py │ └── utils.py ├── textline_merge_v1 │ ├── main.py │ ├── models.py │ ├── textline_merge.py │ └── utils.py └── wasm │ ├── .gitignore │ ├── Cargo.toml │ ├── rust-toolchain │ └── src │ ├── lib.rs │ └── utils.rs ├── specs └── cotrans.yaml ├── types ├── .gitignore ├── LICENSE ├── package.json ├── src │ └── index.ts └── tsconfig.json ├── uno.config.ts ├── userscript ├── .gitignore ├── .vscode │ ├── i18n-ally-custom-framework.yml │ └── settings.json ├── package.json ├── rollup.config.js ├── src │ ├── banner-nsfw.js │ ├── banner-regular.js │ ├── eHentai │ │ ├── gallery.ts │ │ ├── page.ts │ │ └── settings.ts │ ├── i18n │ │ ├── en-US.yml │ │ ├── index.ts │ │ └── zh-CN.yml │ ├── main-nsfw.ts │ ├── main-regular.ts │ ├── main.ts │ ├── misskey │ │ └── index.tsx │ ├── pixiv 
│ │ ├── index.tsx │ │ └── settings.tsx │ ├── settings │ │ └── index.tsx │ ├── shims.d.ts │ ├── twitter │ │ ├── index.tsx │ │ └── settings.tsx │ └── utils │ │ ├── core.ts │ │ ├── index.ts │ │ ├── storage.ts │ │ └── twind.ts ├── tsconfig.json └── vitest.config.ts ├── web ├── .gitignore ├── app.vue ├── components │ ├── footer │ │ └── index.vue │ ├── nav │ │ └── index.vue │ └── u │ │ └── Listbox.vue ├── layouts │ └── default.vue ├── nuxt.config.ts ├── package.json ├── pages │ ├── index.vue │ └── userscript.vue └── tsconfig.json ├── wk-gateway ├── .gitignore ├── buf.gen.yaml ├── build.config.ts ├── package.json ├── shims.d.ts ├── src │ ├── db.ts │ ├── index.ts │ ├── mitWorker │ │ ├── dObject.ts │ │ ├── id.ts │ │ ├── index.ts │ │ └── ttl.ts │ ├── task │ │ ├── index.ts │ │ └── upload.ts │ ├── types.ts │ └── utils │ │ ├── index.ts │ │ ├── memo.ts │ │ └── png.ts ├── tsconfig.json ├── wrangler.domitworker.toml └── wrangler.toml ├── wk-image ├── .gitignore ├── Cargo.toml ├── package.json ├── src │ └── lib.rs └── wrangler.toml └── wkr2 ├── .gitignore ├── .prettierrc ├── README.md ├── package.json ├── src └── index.ts ├── tsconfig.json └── wrangler.toml /.dockerignore: -------------------------------------------------------------------------------- 1 | local-tests 2 | *.ckpt 3 | *.pyc 4 | __pycache__ 5 | target/ 6 | -------------------------------------------------------------------------------- /.eslintignore: -------------------------------------------------------------------------------- 1 | /wk-image/build/ 2 | /target/ 3 | -------------------------------------------------------------------------------- /.eslintrc: -------------------------------------------------------------------------------- 1 | { 2 | "extends": ["@antfu"], 3 | "ignorePatterns": ["/wk-gateway/src/protoGen"] 4 | } 5 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | .DS_Store 2 
| 3 | local-tests 4 | *.ckpt 5 | *.pyc 6 | __pycache__ 7 | 8 | target/ 9 | node_modules 10 | 11 | /gateway/src/prisma.rs 12 | /wk-gateway/src/protoGen 13 | -------------------------------------------------------------------------------- /.npmrc: -------------------------------------------------------------------------------- 1 | shamefully-hoist=true 2 | ignore-workspace-root-check=true 3 | -------------------------------------------------------------------------------- /Cargo.toml: -------------------------------------------------------------------------------- 1 | [workspace] 2 | resolver = "2" 3 | members = ["proto-rs", "wk-image", "img_hash"] 4 | 5 | [workspace.package] 6 | edition = "2021" 7 | rust-version = "1.71.0" 8 | 9 | [profile.release] 10 | lto = true 11 | strip = true 12 | codegen-units = 1 13 | -------------------------------------------------------------------------------- /Cross.toml: -------------------------------------------------------------------------------- 1 | [target.x86_64-unknown-linux-musl] 2 | pre-build = [ 3 | "apt-get update && apt-get install --assume-yes protobuf-compiler", 4 | ] 5 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Cotrans 2 | 3 | A working-in-progress collaborative online image/manga translation platform base on 4 | [manga-image-translator](https://github.com/zyddnys/manga-image-translator). 
5 | 6 | ## Contributing 7 | 8 | ### Repository structure 9 | 10 | | Path | Description | 11 | | ------------ | -------------------------- | 12 | | `docs` | Documentations | 13 | | `specs` | OpenAPI specs (TODO) | 14 | | `proto` | Protobuf definitions | 15 | | `proto-rs` | Prost definitions | 16 | | `migrations` | Database migrations | 17 | | `types` | TypeScript definitions | 18 | | `wk-gateway` | Gateway worker | 19 | | `wk-image` | Image processing worker | 20 | | `img_hash` | Fork of `image_hasher` | 21 | | `wkr2` | R2 worker (private/public) | 22 | | `web` | Website | 23 | | `web-ext` | Browser extension | 24 | | `userscript` | UserScript | 25 | -------------------------------------------------------------------------------- /docs/DEPLOY_INSTANCE.md: -------------------------------------------------------------------------------- 1 | # Instance Deploy Guide 2 | 3 | This guide is exclusively designed for developers who are interested in deploying 4 | their own version of Cotrans. If your intention is to process images on your personal computer, 5 | you should instead refer to the [Translation Worker Deploy Guide](./DEPLOY_WORKER.md). 
6 | 7 | ## Requirements 8 | 9 | You must have: 10 | 11 | - A Cloudflare account 12 | - with an active zone (domain) 13 | - if nameserver changes haven't been applied, wait for it first 14 | - with Workers Paid plan () 15 | - with Durable Objects activated (from the bottom of any Worker's page) 16 | - with R2 plan () 17 | - Any Linux server (to process tasks) 18 | - with Python 3.8+ installed 19 | - if equipped with Nvidia GPU, with the latest PyTorch + CUDA installed 20 | - recommended minimum 28GB RAM, or 16GB RAM with 16GB GPU VRAM 21 | - exposing to the Internet is *not* required 22 | 23 | ## Preparation 24 | 25 | Install the following tools: 26 | 27 | - Node.js 18+ () 28 | - with `pnpm` () 29 | - with `wrangler` (`pnpm i -g wrangler`) 30 | - Rust 1.68+ () 31 | 32 | ```bash 33 | # Generate a pair of ECDSA private/public key (to sign/verify JWT) 34 | # Results will be saved in `private.pem` and `public.pem` 35 | openssl ecparam -name prime256v1 -genkey -noout | tee >(openssl ec -pubout -out public.pem) | openssl pkcs8 -topk8 -nocrypt -out private.pem 36 | 37 | # Clone the repo 38 | git clone https://github.com/VoileLabs/cotrans 39 | cd cotrans 40 | 41 | # Install dependencies 42 | cargo check 43 | pnpm i 44 | 45 | # Build the project 46 | pnpm build 47 | ``` 48 | 49 | ## Deploy R2 buckets and `wkr2` 50 | 51 | Create two R2 buckets in Cloudflare dashboard: `cotrans-public`, `cotrans-private`. 52 | 53 | Bind a custom domain to the `cotrans-public` bucket. 54 | This domain will be referred as `r2.cotrans.example.com` in the following steps. 55 | 56 | Add a CORS policy, with `GET` method allowed. 
57 | 58 | An example policy: 59 | 60 | ```json 61 | [ 62 | { 63 | "AllowedOrigins": [ 64 | "*" 65 | ], 66 | "AllowedMethods": [ 67 | "GET" 68 | ], 69 | "AllowedHeaders": [ 70 | "*" 71 | ], 72 | "ExposeHeaders": [ 73 | "ETag" 74 | ], 75 | "MaxAgeSeconds": 600 76 | } 77 | ] 78 | ``` 79 | 80 | Run the following commands to deploy `cotrans-wkr2-public` and `cotrans-wkr2-private`: 81 | 82 | ```bash 83 | cd wkr2 84 | wrangler deploy --keep-vars 85 | wrangler deploy --keep-vars --env private 86 | ``` 87 | 88 | Open the settings page of both workers, click "Variables", and add the following environment variables: 89 | 90 | - `JWT_PUBLIC_KEY`: the content of `public.pem` 91 | - `JWT_AUDIENCE`: `wk:r2:private` for `cotrans-wkr2-private`, `wk:r2:public` for `cotrans-wkr2-public` 92 | 93 | Scroll down to the "R2 Bucket Bindings" section, ensure a bucket is bound to `BUCKET`. 94 | If not, click "Edit variable" and add a bucket named `BUCKET`, to `cotrans-public` for `wkr2-public`, `cotrans-private` for `wkr2-private`. 95 | 96 | Open the triggers page, add a custom domain for each worker. 97 | The domains will be referred as `public.r2.wk.cotrans.example.com` and `private.r2.wk.cotrans.example.com` in the following steps. 98 | 99 | Both workers are recommended be in "Bundled" usage model. 100 | 101 | ## Deploy `wk-image` 102 | 103 | Run the following commands to deploy `wk-image`: 104 | 105 | ```bash 106 | cd wk-image 107 | wrangler deploy --keep-vars 108 | ``` 109 | 110 | Open the settings page of the worker, ensure a bucket is bound to `BUCKET_PRI`. 111 | If not, click "Edit variable" and add a bucket named `BUCKET_PRI`, to `cotrans-private`. 112 | 113 | The worker must be in "Unbound" usage model. 114 | 115 | ## Deploy `wk-gateway` 116 | 117 | Create a D1 database in Cloudflare dashboard, named `cotrans`. 118 | 119 | Edit `wk-gateway/wrangler.toml`, replace the value of `database_id` with the ID of the database. 
120 | 121 | Edit `wk-gateway/src/index.ts`, put the domain for `web` inside `CORS_ORIGINS`. 122 | 123 | Run the following commands to deploy `cotrans-wk-gateway`: 124 | 125 | ```bash 126 | cd wk-gateway 127 | wrangler d1 migrations apply DB --experimental-backend 128 | wrangler deploy --keep-vars -c wrangler.domitworker.toml 129 | wrangler deploy --keep-vars 130 | ``` 131 | 132 | This should produce two workers: `cotrans-wk-gateway-domitworker` and `cotrans-wk-gateway`. 133 | 134 | Open the settings page of both workers, do the following: 135 | 136 | - Click "Variables", and add the following environment variables: 137 | - `JWT_PRIVATE_KEY`: the content of `private.pem` 138 | - `JWT_PUBLIC_KEY`: the content of `public.pem` 139 | - `MIT_WORKERS_SECRET`: a random string, used by the Linux server to authenticate itself 140 | - Try using a password generator if you don't know what to put 141 | - `WKR2_PRIVATE_BASE`: `https://private.r2.wk.cotrans.example.com` 142 | - `WKR2_PUBLIC_BASE`: `https://public.r2.wk.cotrans.example.com` 143 | - `WKR2_PUBLIC_EXPOSED_BASE`: `https://r2.cotrans.example.com` 144 | - Scroll down to the "Durable Object Bindings" section, ensure the following bindings exist: 145 | - `doMitWorker`: bind to `cotrans-wk-gateway-domitworker_DOMitWorker` 146 | - `doImage`: bind to `cotrans-wk-image_DOImage` 147 | - If not, click "Edit variable" and add the bindings. 148 | - Scroll down to the "Service Bindings" section, ensure the following bindings exist: 149 | - `wkr2_private`: bind to `cotrans-wkr2-private` 150 | - `wkr2_public`: bind to `cotrans-wkr2-public` 151 | - If not, click "Edit variable" and add the bindings. 152 | - On `cotrans-wk-gateway`, open the triggers page, add a custom domain, this will be the api domain. 153 | - The domain will be referred as `gateway.wk.cotrans.example.com` in the following steps. 154 | 155 | Both workers are recommended be in "Bundled" usage model. 
156 | 157 | ## Deploy `web` 158 | 159 | Run the following commands to deploy `web`: 160 | 161 | ```bash 162 | cd web 163 | NUXT_PUBLIC_API_BASE=https://gateway.wk.cotrans.example.com NUXT_PUBLIC_WS_BASE=wss://gateway.wk.cotrans.example.com pnpm generate 164 | wrangler pages deploy .output/public 165 | ``` 166 | 167 | Bind a custom domain to the worker, this will be the website domain. 168 | 169 | ## Deploy mit workers 170 | 171 | SSH into the Linux server, follow the instructions in . 172 | 173 | Set the api keys in `.env` file for translation services you plan to use. 174 | 175 | Replace `` in the following commands with the value of `MIT_WORKERS_SECRET` in `cotrans-wk-gateway`'s environment variables. 176 | 177 | ```bash 178 | WS_SECRET= python -m manga_translator --use-cuda --mode ws --ws-url wss://gateway.wk.cotrans.example.com/mit/worker_ws 179 | ``` 180 | 181 | Congratulations! Your website should be able to translate images now. 182 | -------------------------------------------------------------------------------- /docs/DEPLOY_WORKER.md: -------------------------------------------------------------------------------- 1 | # Translation Worker Deploy Guide 2 | 3 | > TODO (not yet implemented) 4 | 5 | This guide will assist you in setting up a Translation Worker. 6 | Once set up, you can link it to your Cotrans dashboard to process your own images. 
7 | -------------------------------------------------------------------------------- /docs/DEVELOPER.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VoileLabs/cotrans/08992fa0d89e40f22477e90a361823942f2f8c86/docs/DEVELOPER.md -------------------------------------------------------------------------------- /img_hash/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | 3 | name = "image_hasher" 4 | version = "1.2.0" 5 | edition.workspace = true 6 | rust-version.workspace = true 7 | license = "MIT OR Apache-2.0" 8 | publish = false 9 | 10 | authors = [ 11 | "Rafał Mikrut ", 12 | "Austin Bonander ", 13 | ] 14 | description = "A simple library that provides perceptual hashing and difference calculation for images." 15 | documentation = "http://docs.rs/image_hasher" 16 | keywords = ["image", "hash", "perceptual", "difference"] 17 | repository = "http://github.com/qarmin/img_hash" 18 | readme = "README.md" 19 | 20 | [features] 21 | nightly = [] 22 | 23 | [dependencies] 24 | base64 = "0.21.2" 25 | image = { version = "0.24.6", default-features = false } 26 | fast_image_resize = "2.7.3" 27 | rustdct = "0.7" 28 | serde = { version = "1.0", features = ["derive"] } 29 | transpose = "0.2" 30 | 31 | [dev-dependencies] 32 | criterion = "0.5.1" 33 | rand = { version = "0.8", features = ["small_rng"] } 34 | 35 | [[bin]] 36 | name = "hash_image" 37 | -------------------------------------------------------------------------------- /img_hash/LICENSE-MIT: -------------------------------------------------------------------------------- 1 | Copyright (c) 2015-2017 The `img_hash` Crate Developers 2 | 3 | Permission is hereby granted, free of charge, to any 4 | person obtaining a copy of this software and associated 5 | documentation files (the "Software"), to deal in the 6 | Software without restriction, including without 7 | limitation the rights to use, copy, 
modify, merge, 8 | publish, distribute, sublicense, and/or sell copies of 9 | the Software, and to permit persons to whom the Software 10 | is furnished to do so, subject to the following 11 | conditions: 12 | 13 | The above copyright notice and this permission notice 14 | shall be included in all copies or substantial portions 15 | of the Software. 16 | 17 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF 18 | ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED 19 | TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A 20 | PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT 21 | SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY 22 | CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION 23 | OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR 24 | IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER 25 | DEALINGS IN THE SOFTWARE. 26 | -------------------------------------------------------------------------------- /img_hash/src/alg/blockhash.rs: -------------------------------------------------------------------------------- 1 | use std::cmp::Ordering; 2 | use std::mem; 3 | use std::ops::AddAssign; 4 | 5 | // Implementation adapted from Python version: 6 | // https://github.com/commonsmachinery/blockhash-python/blob/e8b009d/blockhash.py 7 | // Main site: http://blockhash.io 8 | use image::{GenericImageView, Pixel}; 9 | 10 | use crate::BitSet; 11 | use crate::{HashBytes, Image}; 12 | 13 | const FLOAT_EQ_MARGIN: f32 = 0.001; 14 | 15 | pub fn blockhash(img: &I, width: u32, height: u32) -> B { 16 | assert_eq!(width % 4, 0, "width must be multiple of 4"); 17 | assert_eq!(height % 4, 0, "height must be multiple of 4"); 18 | 19 | let (iwidth, iheight) = img.dimensions(); 20 | 21 | // Skip the floating point math if it's unnecessary 22 | if iwidth % width == 0 && iheight % height == 0 { 23 | blockhash_fast(img, width, height) 24 | } else { 25 | blockhash_slow(img, width, height) 26 | } 27 | } 28 | 29 | macro_rules! 
gen_hash { 30 | ($imgty:ty, $valty:ty, $blocks: expr, $width:expr, $block_width:expr, $block_height:expr, $eq_fn:expr) => {{ 31 | #[allow(deprecated)] // deprecated as of 0.22 32 | let channel_count = <<$imgty as GenericImageView>::Pixel as Pixel>::CHANNEL_COUNT as u32; 33 | 34 | let group_len = ($width * 4) as usize; 35 | 36 | let block_area = $block_width * $block_height; 37 | 38 | let cmp_factor = match channel_count { 39 | 3 | 4 => 255u32 as $valty * 3u32 as $valty, 40 | 2 | 1 => 255u32 as $valty, 41 | _ => panic!("Unrecognized channel count from Image: {}", channel_count), 42 | } * block_area 43 | / (2u32 as $valty); 44 | 45 | let medians: Vec<$valty> = $blocks.chunks(group_len).map(get_median).collect(); 46 | 47 | BitSet::from_bools( 48 | $blocks 49 | .chunks(group_len) 50 | .zip(medians) 51 | .flat_map(|(blocks, median)| { 52 | blocks 53 | .iter() 54 | .map(move |&block| block > median || ($eq_fn(block, median) && median > cmp_factor)) 55 | }), 56 | ) 57 | }}; 58 | } 59 | 60 | fn block_adder<'a, T: AddAssign + 'a>( 61 | blocks: &'a mut [T], 62 | width: u32, 63 | ) -> impl FnMut(u32, u32, T) + 'a { 64 | move |x, y, add| (blocks[(y as usize) * (width as usize) + (x as usize)] += add) 65 | } 66 | 67 | fn blockhash_slow(img: &I, hwidth: u32, hheight: u32) -> B { 68 | let mut blocks = vec![0f32; (hwidth * hheight) as usize]; 69 | 70 | let (iwidth, iheight) = img.dimensions(); 71 | 72 | // Block dimensions, in pixels 73 | let (block_width, block_height) = ( 74 | iwidth as f32 / hwidth as f32, 75 | iheight as f32 / hheight as f32, 76 | ); 77 | 78 | img.foreach_pixel8(|x, y, px| { 79 | let mut add_to_block = block_adder(&mut blocks, hwidth); 80 | 81 | let px_sum = sum_px(px) as f32; 82 | 83 | let (x, y) = (x as f32, y as f32); 84 | 85 | let block_x = x / block_width; 86 | let block_y = y / block_height; 87 | 88 | let x_mod = x + 1. % block_width; 89 | let y_mod = y + 1. 
% block_height; 90 | 91 | // terminology is mostly arbitrary as long as we're consistent 92 | // if `x` evenly divides `block_height`, this weight will be 0 93 | // so we don't double the sum as `block_top` will equal `block_bottom` 94 | let weight_left = x_mod.fract(); 95 | let weight_right = 1. - weight_left; 96 | let weight_top = y_mod.fract(); 97 | let weight_bottom = 1. - weight_top; 98 | 99 | let block_left = block_x.floor() as u32; 100 | let block_top = block_y.floor() as u32; 101 | 102 | let block_right = if x_mod.trunc() == 0. { 103 | block_x.ceil() as u32 104 | } else { 105 | block_left 106 | }; 107 | 108 | let block_bottom = if y_mod.trunc() == 0. { 109 | block_y.ceil() as u32 110 | } else { 111 | block_top 112 | }; 113 | 114 | add_to_block(block_left, block_top, px_sum * weight_left * weight_top); 115 | add_to_block( 116 | block_left, 117 | block_bottom, 118 | px_sum * weight_left * weight_bottom, 119 | ); 120 | add_to_block(block_right, block_top, px_sum * weight_right * weight_top); 121 | add_to_block( 122 | block_right, 123 | block_bottom, 124 | px_sum * weight_right * weight_bottom, 125 | ); 126 | }); 127 | 128 | gen_hash!( 129 | I, 130 | f32, 131 | blocks, 132 | hwidth, 133 | block_width, 134 | block_height, 135 | |l: f32, r: f32| (l - r).abs() < FLOAT_EQ_MARGIN 136 | ) 137 | } 138 | 139 | fn blockhash_fast(img: &I, hwidth: u32, hheight: u32) -> B { 140 | let mut blocks = vec![0u32; (hwidth * hheight) as usize]; 141 | let (iwidth, iheight) = img.dimensions(); 142 | 143 | let (block_width, block_height) = (iwidth / hwidth, iheight / hheight); 144 | 145 | img.foreach_pixel8(|x, y, px| { 146 | let mut add_to_block = block_adder(&mut blocks, hwidth); 147 | 148 | let px_sum = sum_px(px); 149 | 150 | let block_x = x / block_width; 151 | let block_y = y / block_height; 152 | 153 | add_to_block(block_x, block_y, px_sum); 154 | }); 155 | 156 | gen_hash!(I, u32, blocks, hwidth, block_width, block_height, |l, r| l 157 | == r) 158 | } 159 | 160 | 
#[inline(always)] 161 | fn sum_px(chans: &[u8]) -> u32 { 162 | // Branch prediction should eliminate the match after a few iterations 163 | match chans.len() { 164 | 4 => { 165 | if chans[3] == 0 { 166 | 255 * 3 167 | } else { 168 | sum_px(&chans[..3]) 169 | } 170 | } 171 | 3 => chans.iter().map(|&x| x as u32).sum(), 172 | 2 => { 173 | if chans[1] == 0 { 174 | 255 175 | } else { 176 | chans[0] as u32 177 | } 178 | } 179 | 1 => chans[0] as u32, 180 | channels => panic!("Unsupported channel count in image: {channels}"), 181 | } 182 | } 183 | 184 | fn get_median(data: &[T]) -> T { 185 | let mut scratch = data.to_owned(); 186 | let median = scratch.len() / 2; 187 | *qselect_inplace(&mut scratch, median) 188 | } 189 | 190 | const SORT_THRESH: usize = 8; 191 | 192 | fn qselect_inplace(data: &mut [T], k: usize) -> &mut T { 193 | let len = data.len(); 194 | 195 | assert!( 196 | k < len, 197 | "Called qselect_inplace with k = {k} and data length: {len}", 198 | ); 199 | 200 | if len < SORT_THRESH { 201 | data.sort_by(|left, right| left.partial_cmp(right).unwrap_or(Ordering::Less)); 202 | return &mut data[k]; 203 | } 204 | 205 | let pivot_idx = partition(data); 206 | match k.cmp(&pivot_idx) { 207 | Ordering::Less => qselect_inplace(&mut data[..pivot_idx], k), 208 | Ordering::Equal => &mut data[pivot_idx], 209 | Ordering::Greater => qselect_inplace(&mut data[pivot_idx + 1..], k - pivot_idx - 1), 210 | } 211 | } 212 | 213 | fn partition(data: &mut [T]) -> usize { 214 | let len = data.len(); 215 | 216 | let pivot_idx = { 217 | let first = (&data[0], 0); 218 | let mid = (&data[len / 2], len / 2); 219 | let last = (&data[len - 1], len - 1); 220 | 221 | median_of_3(&first, &mid, &last).1 222 | }; 223 | 224 | data.swap(pivot_idx, len - 1); 225 | 226 | let mut curr = 0; 227 | 228 | for i in 0..len - 1 { 229 | if data[i] < data[len - 1] { 230 | data.swap(i, curr); 231 | curr += 1; 232 | } 233 | } 234 | 235 | data.swap(curr, len - 1); 236 | 237 | curr 238 | } 239 | 240 | fn 
median_of_3(mut x: T, mut y: T, mut z: T) -> T { 241 | if x > y { 242 | mem::swap(&mut x, &mut y); 243 | } 244 | 245 | if x > z { 246 | mem::swap(&mut x, &mut z); 247 | } 248 | 249 | if x > z { 250 | mem::swap(&mut y, &mut z); 251 | } 252 | 253 | y 254 | } 255 | -------------------------------------------------------------------------------- /img_hash/src/alg/mod.rs: -------------------------------------------------------------------------------- 1 | #![allow(clippy::needless_lifetimes)] 2 | use crate::CowImage::*; 3 | use crate::HashVals::*; 4 | use crate::{BitSet, HashCtxt, Image}; 5 | 6 | use self::HashAlg::*; 7 | 8 | mod blockhash; 9 | 10 | /// Hash algorithms implemented by this crate. 11 | /// 12 | /// Implemented primarily based on the high-level descriptions on the blog Hacker Factor 13 | /// written by Dr. Neal Krawetz: http://www.hackerfactor.com/ 14 | /// 15 | /// Note that `hash_width` and `hash_height` in these docs refer to the parameters of 16 | /// [`HasherConfig::hash_size()`](struct.HasherConfig.html#method.hash_size). 17 | /// 18 | /// ### Choosing an Algorithm 19 | /// Each algorithm has different performance characteristics 20 | #[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize)] 21 | pub enum HashAlg { 22 | /// The Mean hashing algorithm. 23 | /// 24 | /// The image is converted to grayscale, scaled down to `hash_width x hash_height`, 25 | /// the mean pixel value is taken, and then the hash bits are generated by comparing 26 | /// the pixels of the descaled image to the mean. 27 | /// 28 | /// This is the most basic hash algorithm supported, resistant only to changes in 29 | /// resolution, aspect ratio, and overall brightness. 30 | /// 31 | /// Further Reading: 32 | /// http://www.hackerfactor.com/blog/?/archives/432-Looks-Like-It.html 33 | Mean, 34 | 35 | /// The Gradient hashing algorithm. 
36 | /// 37 | /// The image is converted to grayscale, scaled down to `(hash_width + 1) x hash_height`, 38 | /// and then in row-major order the pixels are compared with each other, setting bits 39 | /// in the hash for each comparison. The extra pixel is needed to have `hash_width` comparisons 40 | /// per row. 41 | /// 42 | /// This hash algorithm is as fast or faster than Mean (because it only traverses the 43 | /// hash data once) and is more resistant to changes than Mean. 44 | /// 45 | /// Further Reading: 46 | /// http://www.hackerfactor.com/blog/index.php?/archives/529-Kind-of-Like-That.html 47 | Gradient, 48 | 49 | /// The Vertical-Gradient hashing algorithm. 50 | /// 51 | /// Equivalent to [`Gradient`](#variant.Gradient) but operating on the columns of the image 52 | /// instead of the rows. 53 | VertGradient, 54 | 55 | /// The Double-Gradient hashing algorithm. 56 | /// 57 | /// An advanced version of [`Gradient`](#variant.Gradient); 58 | /// resizes the grayscaled image to `(width / 2 + 1) x (height / 2 + 1)` and compares columns 59 | /// in addition to rows. 60 | /// 61 | /// This algorithm is slightly slower than `Gradient` (resizing the image dwarfs 62 | /// the hash time in most cases) but the extra comparison direction may improve results (though 63 | /// you might want to consider increasing 64 | /// [`hash_size`](struct.HasherConfig.html#method.hash_size) 65 | /// to accommodate the extra comparisons). 66 | DoubleGradient, 67 | 68 | /// The [Blockhash.io](https://blockhash.io) algorithm. 69 | /// 70 | /// Compared to the other algorithms, this does not require any preprocessing steps and so 71 | /// may be significantly faster at the cost of some resilience. 
72 | /// 73 | /// The algorithm is described in a high level here: 74 | /// https://github.com/commonsmachinery/blockhash-rfc/blob/master/main.md 75 | Blockhash, 76 | } 77 | 78 | fn next_multiple_of_2(x: u32) -> u32 { 79 | (x + 1) & !1 80 | } 81 | 82 | fn next_multiple_of_4(x: u32) -> u32 { 83 | (x + 3) & !3 84 | } 85 | 86 | impl HashAlg { 87 | pub(crate) fn hash_image(&self, ctxt: &HashCtxt, image: &I) -> B 88 | where 89 | I: Image, 90 | B: BitSet, 91 | { 92 | let post_gauss = ctxt.gauss_preproc(image); 93 | 94 | let HashCtxt { width, height, .. } = *ctxt; 95 | 96 | if *self == Blockhash { 97 | return match post_gauss { 98 | Borrowed(img) => blockhash::blockhash(img, width, height), 99 | Owned(img) => blockhash::blockhash(&img, width, height), 100 | }; 101 | } 102 | 103 | let grayscale = post_gauss.to_grayscale(); 104 | let (resize_width, resize_height) = self.resize_dimensions(width, height); 105 | 106 | let hash_vals = ctxt.calc_hash_vals(&grayscale, resize_width, resize_height); 107 | 108 | let rowstride = resize_width as usize; 109 | 110 | match (*self, hash_vals) { 111 | (Mean, Floats(ref floats)) => B::from_bools(mean_hash_f32(floats)), 112 | (Mean, Bytes(ref bytes)) => B::from_bools(mean_hash_u8(bytes)), 113 | (Gradient, Floats(ref floats)) => B::from_bools(gradient_hash(floats, rowstride)), 114 | (Gradient, Bytes(ref bytes)) => B::from_bools(gradient_hash(bytes, rowstride)), 115 | (VertGradient, Floats(ref floats)) => B::from_bools(vert_gradient_hash(floats, rowstride)), 116 | (VertGradient, Bytes(ref bytes)) => B::from_bools(vert_gradient_hash(bytes, rowstride)), 117 | (DoubleGradient, Floats(ref floats)) => { 118 | B::from_bools(double_gradient_hash(floats, rowstride)) 119 | } 120 | (DoubleGradient, Bytes(ref bytes)) => B::from_bools(double_gradient_hash(bytes, rowstride)), 121 | (Blockhash, _) => unreachable!(), 122 | } 123 | } 124 | 125 | pub(crate) fn round_hash_size(&self, width: u32, height: u32) -> (u32, u32) { 126 | match *self { 127 | 
DoubleGradient => (next_multiple_of_2(width), next_multiple_of_2(height)), 128 | Blockhash => (next_multiple_of_4(width), next_multiple_of_4(height)), 129 | _ => (width, height), 130 | } 131 | } 132 | 133 | pub(crate) fn resize_dimensions(&self, width: u32, height: u32) -> (u32, u32) { 134 | match *self { 135 | Mean => (width, height), 136 | Blockhash => panic!("Blockhash algorithm does not resize"), 137 | Gradient => (width + 1, height), 138 | VertGradient => (width, height + 1), 139 | DoubleGradient => (width / 2 + 1, height / 2 + 1), 140 | } 141 | } 142 | } 143 | 144 | fn mean_hash_u8<'a>(luma: &'a [u8]) -> impl Iterator + 'a { 145 | let mean = (luma.iter().map(|&l| l as u32).sum::() / luma.len() as u32) as u8; 146 | luma.iter().map(move |&x| x >= mean) 147 | } 148 | 149 | fn mean_hash_f32<'a>(luma: &'a [f32]) -> impl Iterator + 'a { 150 | let mean = luma.iter().sum::() / luma.len() as f32; 151 | luma.iter().map(move |&x| x >= mean) 152 | } 153 | 154 | /// The guts of the gradient hash separated so we can reuse them 155 | fn gradient_hash_impl(luma: I) -> impl Iterator 156 | where 157 | I: IntoIterator + Clone, 158 | ::Item: PartialOrd, 159 | { 160 | luma 161 | .clone() 162 | .into_iter() 163 | .skip(1) 164 | .zip(luma) 165 | .map(|(this, last)| last < this) 166 | } 167 | 168 | fn gradient_hash<'a, T: PartialOrd>( 169 | luma: &'a [T], 170 | rowstride: usize, 171 | ) -> impl Iterator + 'a { 172 | luma.chunks(rowstride).flat_map(gradient_hash_impl) 173 | } 174 | 175 | fn vert_gradient_hash<'a, T: PartialOrd>( 176 | luma: &'a [T], 177 | rowstride: usize, 178 | ) -> impl Iterator + 'a { 179 | (0..rowstride) 180 | .map(move |col_start| luma[col_start..].iter().step_by(rowstride)) 181 | .flat_map(gradient_hash_impl) 182 | } 183 | 184 | fn double_gradient_hash<'a, T: PartialOrd>( 185 | luma: &'a [T], 186 | rowstride: usize, 187 | ) -> impl Iterator + 'a { 188 | gradient_hash(luma, rowstride).chain(vert_gradient_hash(luma, rowstride)) 189 | } 190 | 
-------------------------------------------------------------------------------- /img_hash/src/bin/hash_image.rs: -------------------------------------------------------------------------------- 1 | //! Hash an image and print the Base64 value 2 | 3 | use std::env; 4 | 5 | use image_hasher::HasherConfig; 6 | 7 | fn main() -> Result<(), String> { 8 | let args = env::args().collect::>(); 9 | assert_eq!(args.len(), 2); 10 | 11 | let image = image::open(&args[1]).map_err(|e| format!("failed to open {}: {}", &args[1], e))?; 12 | 13 | let hash = HasherConfig::new() 14 | .hash_size(8, 8) 15 | .to_hasher() 16 | .hash_image(&image); 17 | 18 | let hash_str = hash 19 | .as_bytes() 20 | .iter() 21 | .map(|b| format!("{b:02x}")) 22 | .collect::(); 23 | 24 | println!("{}: {}", &args[1], hash_str); 25 | 26 | Ok(()) 27 | } 28 | -------------------------------------------------------------------------------- /img_hash/src/dct.rs: -------------------------------------------------------------------------------- 1 | use std::sync::Arc; 2 | 3 | use rustdct::{DctPlanner, TransformType2And3}; 4 | use transpose::transpose_inplace; 5 | 6 | pub const SIZE_MULTIPLIER: u32 = 2; 7 | pub const SIZE_MULTIPLIER_U: usize = SIZE_MULTIPLIER as usize; 8 | 9 | pub struct DctCtxt { 10 | row_dct: Arc>, 11 | col_dct: Arc>, 12 | width: usize, 13 | height: usize, 14 | } 15 | 16 | impl DctCtxt { 17 | pub fn new(width: u32, height: u32) -> Self { 18 | let mut planner = DctPlanner::new(); 19 | let width = width as usize * SIZE_MULTIPLIER_U; 20 | let height = height as usize * SIZE_MULTIPLIER_U; 21 | 22 | DctCtxt { 23 | row_dct: planner.plan_dct2(width), 24 | col_dct: planner.plan_dct2(height), 25 | width, 26 | height, 27 | } 28 | } 29 | 30 | pub fn width(&self) -> u32 { 31 | self.width as u32 32 | } 33 | 34 | pub fn height(&self) -> u32 { 35 | self.height as u32 36 | } 37 | 38 | /// Perform a 2D DCT on a 1D-packed vector with a given `width x height`. 
39 | /// 40 | /// Assumes `packed_2d` is double-length for scratch space. Returns the vector truncated to 41 | /// `width * height`. 42 | /// 43 | /// ### Panics 44 | /// If `self.width * self.height * 2 != packed_2d.len()` 45 | pub fn dct_2d(&self, mut packed_2d: Vec) -> Vec { 46 | let Self { 47 | ref row_dct, 48 | ref col_dct, 49 | width, 50 | height, 51 | } = *self; 52 | 53 | let trunc_len = width * height; 54 | assert_eq!(trunc_len + self.required_scratch(), packed_2d.len()); 55 | 56 | { 57 | let (packed_2d, scratch) = packed_2d.split_at_mut(trunc_len); 58 | 59 | for row_in in packed_2d.chunks_mut(width) { 60 | row_dct.process_dct2_with_scratch(row_in, scratch); 61 | } 62 | 63 | transpose_inplace( 64 | packed_2d, 65 | &mut scratch[..std::cmp::max(width, height)], 66 | width, 67 | height, 68 | ); 69 | 70 | for row_in in packed_2d.chunks_mut(height) { 71 | col_dct.process_dct2_with_scratch(row_in, scratch); 72 | } 73 | 74 | transpose_inplace( 75 | packed_2d, 76 | &mut scratch[..std::cmp::max(width, height)], 77 | width, 78 | height, 79 | ); 80 | } 81 | 82 | packed_2d.truncate(trunc_len); 83 | packed_2d 84 | } 85 | 86 | pub fn crop_2d(&self, packed: Vec) -> Vec { 87 | crop_2d_dct(packed, self.width) 88 | } 89 | 90 | pub fn required_scratch(&self) -> usize { 91 | let transpose_scratch = std::cmp::max(self.width, self.height); 92 | let dct_scratch = std::cmp::max( 93 | self.row_dct.get_scratch_len(), 94 | self.col_dct.get_scratch_len(), 95 | ); 96 | std::cmp::max(transpose_scratch, dct_scratch) 97 | } 98 | } 99 | 100 | /// Crop the values off a 1D-packed 2D DCT. 
101 | /// 102 | /// Returns `packed` truncated to the premultiplied size, as determined by `rowstride` 103 | /// 104 | /// Generic for easier testing 105 | fn crop_2d_dct(mut packed: Vec, rowstride: usize) -> Vec { 106 | // assert that the rowstride was previously multiplied by SIZE_MULTIPLIER 107 | assert_eq!(rowstride % SIZE_MULTIPLIER_U, 0); 108 | assert!( 109 | rowstride / SIZE_MULTIPLIER_U > 0, 110 | "rowstride cannot be cropped: {rowstride}", 111 | ); 112 | 113 | let new_rowstride = rowstride / SIZE_MULTIPLIER_U; 114 | 115 | for new_row in 0..packed.len() / (rowstride * SIZE_MULTIPLIER_U) { 116 | let (dest, src) = packed.split_at_mut(new_row * new_rowstride + rowstride); 117 | let dest_start = dest.len() - new_rowstride; 118 | let src_start = new_rowstride * new_row; 119 | let src_end = src_start + new_rowstride; 120 | dest[dest_start..].copy_from_slice(&src[src_start..src_end]); 121 | } 122 | 123 | let new_len = packed.len() / (SIZE_MULTIPLIER_U * SIZE_MULTIPLIER_U); 124 | packed.truncate(new_len); 125 | 126 | packed 127 | } 128 | 129 | #[test] 130 | fn test_crop_2d_dct() { 131 | let packed: Vec = (0..64).collect(); 132 | assert_eq!( 133 | crop_2d_dct(packed.clone(), 8), 134 | [ 135 | 0, 1, 2, 3, // 4, 5, 6, 7 136 | 8, 9, 10, 11, // 12, 13, 14, 15 137 | 16, 17, 18, 19, // 20, 21, 22, 23, 138 | 24, 25, 26, 27, // 28, 29, 30, 31, 139 | // 32 .. 
64
    ]
  );
}

#[test]
fn test_transpose() {}
-------------------------------------------------------------------------------- /img_hash/src/fr.rs: --------------------------------------------------------------------------------
use std::num::NonZeroU32;

use fast_image_resize as fr;
pub use fr::FilterType;
use image::GrayImage;

/// Resize an 8-bit grayscale image to `width x height` using the given
/// convolution filter via `fast_image_resize`.
///
/// ### Panics
/// If any source or target dimension is zero (the `NonZeroU32::new(..).unwrap()`
/// calls below), or if `fast_image_resize` rejects the buffers.
pub fn resize_gray(image: &GrayImage, width: u32, height: u32, filter: FilterType) -> GrayImage {
  let src_view: fr::ImageView<'_, fr::pixels::U8> = fr::ImageView::from_buffer(
    NonZeroU32::new(image.width()).unwrap(),
    NonZeroU32::new(image.height()).unwrap(),
    image.as_raw(),
  )
  .unwrap();
  let src_view = fr::DynamicImageView::from(src_view);

  let mut dst_img = fr::Image::new(
    NonZeroU32::new(width).unwrap(),
    NonZeroU32::new(height).unwrap(),
    fr::PixelType::U8,
  );

  let mut dst_view = dst_img.view_mut();

  let mut resizer = fr::Resizer::new(fr::ResizeAlg::Convolution(filter));
  resizer.resize(&src_view, &mut dst_view).unwrap();

  // Repack the resized buffer as a `GrayImage`; dimensions match by construction.
  image::GrayImage::from_vec(
    dst_img.width().get(),
    dst_img.height().get(),
    dst_img.into_vec(),
  )
  .unwrap()
}
-------------------------------------------------------------------------------- /img_hash/src/traits.rs: --------------------------------------------------------------------------------
use std::borrow::Cow;
use std::ops;

use image::{imageops, DynamicImage, GenericImageView, GrayImage, ImageBuffer, Pixel};

/// Interface for types used for storing hash data.
///
/// This is implemented for `Vec<u8>`, `Box<[u8]>` and arrays that are multiples/combinations of
/// useful x86 bytewise SIMD register widths (64, 128, 256, 512 bits).
///
/// Please feel free to open a pull request [on Github](https://github.com/qarmin/img_hash)
/// if you need this implemented for a different array size.
13 | pub trait HashBytes { 14 | /// Construct this type from an iterator of bytes. 15 | /// 16 | /// If this type has a finite capacity (i.e. an array) then it can ignore extra data 17 | /// (the hash API will not create a hash larger than this type can contain). Unused capacity 18 | /// **must** be zeroed. 19 | fn from_iter>(iter: I) -> Self 20 | where 21 | Self: Sized; 22 | 23 | /// Return the maximum capacity of this type, in bits. 24 | /// 25 | /// If this type has an arbitrary/theoretically infinite capacity, return `usize::max_value()`. 26 | fn max_bits() -> usize; 27 | 28 | /// Get the hash bytes as a slice. 29 | fn as_slice(&self) -> &[u8]; 30 | } 31 | 32 | impl HashBytes for Box<[u8]> { 33 | fn from_iter>(iter: I) -> Self { 34 | // stable in 1.32, effectively the same thing 35 | // iter.collect() 36 | iter.collect::>().into_boxed_slice() 37 | } 38 | 39 | fn max_bits() -> usize { 40 | usize::MAX 41 | } 42 | 43 | fn as_slice(&self) -> &[u8] { 44 | self 45 | } 46 | } 47 | 48 | impl HashBytes for Vec { 49 | fn from_iter>(iter: I) -> Self { 50 | iter.collect() 51 | } 52 | 53 | fn max_bits() -> usize { 54 | usize::MAX 55 | } 56 | 57 | fn as_slice(&self) -> &[u8] { 58 | self 59 | } 60 | } 61 | 62 | macro_rules! 
hash_bytes_array { 63 | ($($n:expr),*) => {$( 64 | impl HashBytes for [u8; $n] { 65 | fn from_iter>(mut iter: I) -> Self { 66 | // optimizer should eliminate this zeroing 67 | let mut out = [0; $n]; 68 | 69 | for (src, dest) in iter.by_ref().zip(out.as_mut()) { 70 | *dest = src; 71 | } 72 | 73 | out 74 | } 75 | 76 | fn max_bits() -> usize { 77 | $n * 8 78 | } 79 | 80 | fn as_slice(&self) -> &[u8] { self } 81 | } 82 | )*} 83 | } 84 | 85 | hash_bytes_array!(8, 16, 24, 32, 40, 48, 56, 64); 86 | 87 | struct BoolsToBytes { 88 | iter: I, 89 | } 90 | 91 | impl Iterator for BoolsToBytes 92 | where 93 | I: Iterator, 94 | { 95 | type Item = u8; 96 | 97 | fn next(&mut self) -> Option<::Item> { 98 | // starts at the LSB and works up 99 | self 100 | .iter 101 | .by_ref() 102 | .take(8) 103 | .enumerate() 104 | .fold(None, |accum, (n, val)| { 105 | accum.or(Some(0)).map(|accum| accum | ((val as u8) << n)) 106 | }) 107 | } 108 | 109 | fn size_hint(&self) -> (usize, Option) { 110 | let (lower, upper) = self.iter.size_hint(); 111 | ( 112 | lower / 8, 113 | // if the upper bound doesn't evenly divide by `8` then we will yield an extra item 114 | upper.map(|upper| { 115 | if upper % 8 == 0 { 116 | upper / 8 117 | } else { 118 | upper / 8 + 1 119 | } 120 | }), 121 | ) 122 | } 123 | } 124 | 125 | pub(crate) trait BitSet: HashBytes { 126 | fn from_bools>(iter: I) -> Self 127 | where 128 | Self: Sized, 129 | { 130 | Self::from_iter(BoolsToBytes { iter }) 131 | } 132 | 133 | fn hamming(&self, other: &Self) -> u32 { 134 | self 135 | .as_slice() 136 | .iter() 137 | .zip(other.as_slice()) 138 | .map(|(l, r)| (l ^ r).count_ones()) 139 | .sum() 140 | } 141 | } 142 | 143 | impl BitSet for T {} 144 | 145 | /// Shorthand trait bound for APIs in this crate. 146 | /// 147 | /// Currently only implemented for the types provided by `image` with 8-bit channels. 148 | pub trait Image: GenericImageView + 'static { 149 | /// The equivalent `ImageBuffer` type for this container. 
150 | type Buf: Image + DiffImage; 151 | 152 | /// Grayscale the image, reducing to 8 bit depth and dropping the alpha channel. 153 | fn to_grayscale(&self) -> Cow; 154 | 155 | /// Blur the image with the given `Gaussian` sigma. 156 | fn blur(&self, sigma: f32) -> Self::Buf; 157 | 158 | /// Iterate over the image, passing each pixel's coordinates and values in `u8` to the closure. 159 | /// 160 | /// The iteration order is unspecified but each pixel **must** be visited exactly _once_. 161 | /// 162 | /// If the pixel's channels are wider than 8 bits then the values should be scaled to 163 | /// `[0, 255]`, not truncated. 164 | /// 165 | /// ### Note 166 | /// If the pixel data length is 2 or 4, the last index is assumed to be the alpha channel. 167 | /// A pixel data length outside of `[1, 4]` will cause a panic. 168 | fn foreach_pixel8(&self, foreach: F) 169 | where 170 | F: FnMut(u32, u32, &[u8]); 171 | } 172 | 173 | /// Image types that can be diffed. 174 | pub trait DiffImage { 175 | /// Subtract the pixel values of `other` from `self` in-place. 
176 | fn diff_inplace(&mut self, other: &Self); 177 | } 178 | 179 | #[cfg(not(feature = "nightly"))] 180 | impl Image for ImageBuffer 181 | where 182 | P: Pixel, 183 | C: ops::Deref, 184 | { 185 | type Buf = ImageBuffer>; 186 | 187 | fn to_grayscale(&self) -> Cow { 188 | Cow::Owned(imageops::grayscale(self)) 189 | } 190 | 191 | fn blur(&self, sigma: f32) -> Self::Buf { 192 | imageops::blur(self, sigma) 193 | } 194 | 195 | fn foreach_pixel8(&self, mut foreach: F) 196 | where 197 | F: FnMut(u32, u32, &[u8]), 198 | { 199 | self 200 | .enumerate_pixels() 201 | .for_each(|(x, y, px)| foreach(x, y, px.channels())); 202 | } 203 | } 204 | 205 | #[cfg(feature = "nightly")] 206 | impl Image for ImageBuffer 207 | where 208 | P: Pixel, 209 | C: ops::Deref, 210 | { 211 | type Buf = ImageBuffer>; 212 | 213 | default fn to_grayscale(&self) -> Cow { 214 | Cow::Owned(imageops::grayscale(self)) 215 | } 216 | 217 | default fn blur(&self, sigma: f32) -> Self::Buf { 218 | imageops::blur(self, sigma) 219 | } 220 | 221 | default fn foreach_pixel8(&self, mut foreach: F) 222 | where 223 | F: FnMut(u32, u32, &[u8]), 224 | { 225 | self 226 | .enumerate_pixels() 227 | .for_each(|(x, y, px)| foreach(x, y, px.channels())) 228 | } 229 | } 230 | 231 | impl DiffImage for ImageBuffer> 232 | where 233 | P: Pixel, 234 | { 235 | fn diff_inplace(&mut self, other: &Self) { 236 | self.iter_mut().zip(other.iter()).for_each(|(l, r)| { 237 | *l = l.wrapping_sub(*r); 238 | }); 239 | } 240 | } 241 | 242 | impl Image for DynamicImage { 243 | type Buf = image::RgbaImage; 244 | 245 | fn to_grayscale(&self) -> Cow { 246 | self 247 | .as_luma8() 248 | .map_or_else(|| Cow::Owned(self.to_luma8()), Cow::Borrowed) 249 | } 250 | 251 | fn blur(&self, sigma: f32) -> Self::Buf { 252 | imageops::blur(self, sigma) 253 | } 254 | 255 | fn foreach_pixel8(&self, mut foreach: F) 256 | where 257 | F: FnMut(u32, u32, &[u8]), 258 | { 259 | self 260 | .pixels() 261 | .for_each(|(x, y, px)| foreach(x, y, px.channels())); 262 | } 263 
}

#[cfg(feature = "nightly")]
impl Image for GrayImage {
  // type Buf = GrayImage;

  // Avoids copying
  fn to_grayscale(&self) -> Cow<GrayImage> {
    Cow::Borrowed(self)
  }
}

#[test]
fn test_bools_to_bytes() {
  let bools = (0..16).map(|x| x & 1 == 0);
  let bytes = Vec::from_bools(bools.clone());
  assert_eq!(*bytes, [0b01010101; 2]);

  let bools_to_bytes = BoolsToBytes { iter: bools };
  assert_eq!(bools_to_bytes.size_hint(), (2, Some(2)));
}
-------------------------------------------------------------------------------- /migrations/0000_init.sql: --------------------------------------------------------------------------------
-- Migration number: 0000 2023-07-09T09:49:35.518Z

CREATE TABLE IF NOT EXISTS source_image (
  id TEXT PRIMARY KEY,
  hash TEXT NOT NULL,
  file TEXT NOT NULL UNIQUE,
  width INTEGER NOT NULL,
  height INTEGER NOT NULL,
  dummy INTEGER NOT NULL DEFAULT 0,
  created_at DATETIME DEFAULT CURRENT_TIMESTAMP,
  updated_at DATETIME DEFAULT CURRENT_TIMESTAMP
);

CREATE TRIGGER update_source_updated_at
AFTER UPDATE OF id, hash, file, width, height ON source_image
FOR EACH ROW
BEGIN
  UPDATE source_image SET updated_at = CURRENT_TIMESTAMP WHERE id = NEW.id;
END;

CREATE TABLE IF NOT EXISTS task (
  -- FIX: was `PRIMARY_KEY` (with an underscore). SQLite accepts multi-word
  -- type names, so `TEXT PRIMARY_KEY` silently became the column *type* and
  -- the table was created without any primary key at all.
  -- NOTE(review): if this migration already ran in production, ship this fix
  -- as a new migration instead of editing this file.
  id TEXT PRIMARY KEY,
  source_image_id TEXT NOT NULL,
  target_language INTEGER NOT NULL,
  detector INTEGER NOT NULL,
  direction INTEGER NOT NULL,
  translator INTEGER NOT NULL,
  size INTEGER NOT NULL,
  state INTEGER NOT NULL DEFAULT 1,
  last_attempted_at DATETIME,
  worker_revision INTEGER NOT NULL DEFAULT 0,
  failed_count INTEGER NOT NULL DEFAULT 0,
  translation_mask TEXT,
  dummy INTEGER NOT NULL DEFAULT 0,
  created_at DATETIME DEFAULT CURRENT_TIMESTAMP,
  updated_at DATETIME DEFAULT CURRENT_TIMESTAMP
);

CREATE
TRIGGER update_task_updated_at 40 | AFTER UPDATE OF id, source_image_id, target_language, detector, direction, translator, size, state, last_attempted_at, worker_revision, failed_count, translation_mask ON task 41 | FOR EACH ROW 42 | BEGIN 43 | UPDATE task SET updated_at = CURRENT_TIMESTAMP WHERE id = NEW.id; 44 | END; 45 | 46 | CREATE UNIQUE INDEX ix_task_source_params_revision ON task (source_image_id, target_language, detector, direction, translator, size, worker_revision); 47 | -------------------------------------------------------------------------------- /migrations/0001_source_size.sql: -------------------------------------------------------------------------------- 1 | -- Migration number: 0001 2023-07-14T15:12:56.498Z 2 | 3 | ALTER TABLE source_image ADD COLUMN size INTEGER NOT NULL; 4 | -------------------------------------------------------------------------------- /migrations/0002_source_size_trigger.sql: -------------------------------------------------------------------------------- 1 | -- Migration number: 0002 2023-07-14T20:52:24.994Z 2 | 3 | DROP TRIGGER IF EXISTS update_source_updated_at; 4 | 5 | CREATE TRIGGER update_source_updated_at 6 | AFTER UPDATE OF id, hash, file, size, width, height ON source_image 7 | FOR EACH ROW 8 | BEGIN 9 | UPDATE source_image SET updated_at = CURRENT_TIMESTAMP WHERE id = NEW.id; 10 | END; 11 | -------------------------------------------------------------------------------- /package.json: -------------------------------------------------------------------------------- 1 | { 2 | "private": true, 3 | "scripts": { 4 | "lint": "eslint .", 5 | "build": "pnpm run -r build" 6 | }, 7 | "devDependencies": { 8 | "@antfu/eslint-config": "^0.39.8", 9 | "eslint": "^8.45.0", 10 | "typescript": "^5.1.6" 11 | } 12 | } 13 | -------------------------------------------------------------------------------- /pnpm-workspace.yaml: -------------------------------------------------------------------------------- 1 | packages: 2 | - web 3 | - 
web-ext 4 | - userscript 5 | - wk-gateway 6 | - wkr2 7 | - types 8 | -------------------------------------------------------------------------------- /proto-rs/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "cotrans-proto-rs" 3 | version = "0.1.5" 4 | edition.workspace = true 5 | rust-version.workspace = true 6 | publish = false 7 | 8 | # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html 9 | 10 | [dependencies] 11 | prost = "0.11.9" 12 | prost-types = "0.11.9" 13 | 14 | [build-dependencies] 15 | prost-build = "0.11.9" 16 | -------------------------------------------------------------------------------- /proto-rs/build.rs: -------------------------------------------------------------------------------- 1 | use std::io::Result; 2 | fn main() -> Result<()> { 3 | prost_build::compile_protos(&["../proto/gateway.mit.proto"], &["../proto"])?; 4 | Ok(()) 5 | } 6 | -------------------------------------------------------------------------------- /proto-rs/src/lib.rs: -------------------------------------------------------------------------------- 1 | pub mod gateway { 2 | pub mod mit { 3 | include!(concat!(env!("OUT_DIR"), "/gateway.mit.rs")); 4 | } 5 | } 6 | -------------------------------------------------------------------------------- /proto/gateway.mit.proto: -------------------------------------------------------------------------------- 1 | syntax = "proto3"; 2 | 3 | package gateway.mit; 4 | 5 | message NewTask { 6 | string id = 1; 7 | 8 | string source_image = 2; 9 | 10 | string target_language = 3; 11 | string detector = 4; 12 | string direction = 5; 13 | string translator = 6; 14 | string size = 7; 15 | 16 | string translation_mask = 8; 17 | } 18 | 19 | message Status { 20 | string id = 1; 21 | string status = 2; 22 | } 23 | 24 | message FinishTask { 25 | string id = 1; 26 | bool success = 2; 27 | bool has_translation_mask = 3; 28 | } 29 | 30 | 
message WebSocketMessage { 31 | oneof message { 32 | NewTask new_task = 1; 33 | Status status = 2; 34 | FinishTask finish_task = 3; 35 | } 36 | } 37 | -------------------------------------------------------------------------------- /rust-toolchain.toml: -------------------------------------------------------------------------------- 1 | [toolchain] 2 | channel = "nightly" 3 | -------------------------------------------------------------------------------- /rustfmt.toml: -------------------------------------------------------------------------------- 1 | tab_spaces = 2 2 | -------------------------------------------------------------------------------- /services/inpainting_lama_v1/main.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Any 3 | from models import * 4 | from inpainting import load_model, run_inpainting 5 | 6 | import numpy as np 7 | from PIL import Image 8 | import io 9 | import cv2 10 | import secrets 11 | 12 | from fastapi import FastAPI, Form, File, UploadFile, Response 13 | from fastapi.responses import StreamingResponse 14 | 15 | app = FastAPI() 16 | 17 | class JsonAndImageResponse(Response) : 18 | def render(self, content: Any) -> bytes: 19 | boundary = secrets.token_bytes(16).hex() 20 | json_data: dict = content["json"] 21 | img_data: Image.Image = content["img"] 22 | img_type: str = content["img-type"] 23 | self.media_type = f"multipart/related; boundary={boundary}; start=\"jsonData\";" 24 | json_content = json.dumps(json_data) 25 | ans = io.BytesIO() 26 | ans.write(f"--{boundary}\r\n".encode('utf-8')) 27 | ans.write(b"Content-Type: application/json\r\nContent-ID: jsonData\r\n\r\n") 28 | ans.write(json_content.encode('utf-8')) 29 | ans.write(f"\r\n--{boundary}\r\n".encode('utf-8')) 30 | ans.write(f"Content-Type: image/{img_type}\r\nContent-ID: imageData\r\n\r\n".encode('utf-8')) 31 | img_data.save(ans, format = 'PNG') 32 | ans.write(f"\r\n--{boundary}--".encode('utf-8')) 33 | return 
ans.getvalue() 34 | 35 | @app.post("/v1/inpaint") 36 | async def inpaint(config: V1InapintingLamaRequest = Form(), image: UploadFile = File(), mask: UploadFile = File()) : 37 | img = Image.open(image.file) 38 | img_np = np.asarray(img) 39 | mask = Image.open(mask.file) 40 | mask_np = np.asarray(mask) 41 | if image.shape[:2] != mask.shape[:2] : 42 | raise ValueError(f'Image size (={image.shape[:2]}) must be the same as mask size (={mask.shape[:2]})') 43 | if len(mask_np.shape) != 2 : 44 | if mask_np.shape[-1] == 3 : 45 | mask_np = mask_np[:, :, 0] 46 | inpainted_img_np, version = run_inpainting(app, config, img_np, mask_np) 47 | resp = V1InapintingLamaResponse(version = version) 48 | return JsonAndImageResponse({"json": resp.dict(), "img": Image.fromarray(inpainted_img_np), "img-type": "png"}) 49 | 50 | @app.on_event("startup") 51 | async def startup_event() : 52 | load_model(app) 53 | -------------------------------------------------------------------------------- /services/inpainting_lama_v1/models.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Optional 3 | from pydantic import BaseModel, ValidationError, validator 4 | 5 | import json 6 | 7 | class V1InapintingLamaRequest(BaseModel) : 8 | use_poisson_blending: bool = False 9 | cuda: bool = False 10 | inpainting_size: int = 1024 11 | 12 | @classmethod 13 | def __get_validators__(cls): 14 | yield cls.validate_to_json 15 | 16 | @classmethod 17 | def validate_to_json(cls, value): 18 | if isinstance(value, str): 19 | return cls(**json.loads(value)) 20 | return value 21 | 22 | @validator("inpainting_size") 23 | def divisible_by_pad_size(cls, v) : 24 | pad_size = 8 25 | if v % pad_size != 0 : 26 | raise ValueError(f'inpainting_size(={v}) must be divisible by {pad_size}') 27 | return v 28 | 29 | class V1InapintingLamaResponse(BaseModel) : 30 | version: str 31 | 32 | @classmethod 33 | def __get_validators__(cls): 34 | yield cls.validate_to_json 35 | 36 | 
@classmethod 37 | def validate_to_json(cls, value): 38 | if isinstance(value, str): 39 | return cls(**json.loads(value)) 40 | return value 41 | -------------------------------------------------------------------------------- /services/mask_refinement_v1/main.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Any 3 | from models import * 4 | from text_mask_utils import run_refine_mask 5 | 6 | import numpy as np 7 | from PIL import Image 8 | import io 9 | import cv2 10 | import secrets 11 | 12 | from fastapi import FastAPI, Form, File, UploadFile, Response 13 | app = FastAPI() 14 | 15 | class JsonAndImageResponse(Response) : 16 | def render(self, content: Any) -> bytes: 17 | boundary = secrets.token_bytes(16).hex() 18 | json_data: dict = content["json"] 19 | img_data: Image.Image = content["img"] 20 | img_type: str = content["img-type"] 21 | self.media_type = f"multipart/related; boundary={boundary}; start=\"jsonData\";" 22 | json_content = json.dumps(json_data) 23 | ans = io.BytesIO() 24 | ans.write(f"--{boundary}\r\n".encode('utf-8')) 25 | ans.write(b"Content-Type: application/json\r\nContent-ID: jsonData\r\n\r\n") 26 | ans.write(json_content.encode('utf-8')) 27 | ans.write(f"\r\n--{boundary}\r\n".encode('utf-8')) 28 | ans.write(f"Content-Type: image/{img_type}\r\nContent-ID: imageData\r\n\r\n".encode('utf-8')) 29 | img_data.save(ans, format = 'PNG') 30 | ans.write(f"\r\n--{boundary}--".encode('utf-8')) 31 | return ans.getvalue() 32 | 33 | @app.post("/v1/refine") 34 | async def refine(config: V1MaskRefinementRequest = Form(), image: UploadFile = File(), mask: UploadFile = File()) : 35 | img = Image.open(image.file) 36 | img_np = np.asarray(img) 37 | mask = Image.open(mask.file) 38 | mask_np = np.asarray(mask) 39 | if img_np.shape[:2] != img_np.shape[:2] : 40 | raise ValueError(f'Image size (={img_np.shape[:2]}) must be the same as mask size (={img_np.shape[:2]})') 41 | if len(mask_np.shape) != 2 : 42 | if 
mask_np.shape[-1] == 3 : 43 | mask_np = mask_np[:, :, 0] 44 | textlines = [Quadrilateral.from_tref(t, img.width, img.height) for t in config.textlines] 45 | mask_np, version = run_refine_mask(img_np, mask_np, textlines, config.method) 46 | resp = V1MaskRefinementResponse(version = version) 47 | return JsonAndImageResponse({"json": resp.dict(exclude_none = True), "img": Image.fromarray(mask_np), "img-type": "png"}) 48 | -------------------------------------------------------------------------------- /services/mask_refinement_v1/models.py: -------------------------------------------------------------------------------- 1 | 2 | from __future__ import annotations 3 | from typing import List, Optional, Tuple 4 | from pydantic import BaseModel 5 | 6 | import json 7 | 8 | class TextRegionExchangeFormat(BaseModel) : 9 | fmt: str 10 | coords: str 11 | fg: Optional[Tuple[int, int, int]] 12 | bg: Optional[Tuple[int, int, int]] 13 | text: Optional[str] 14 | prob: Optional[float] = 0 15 | direction: Optional[str] 16 | lines: List[TextRegionExchangeFormat] = [] 17 | 18 | from utils import Quadrilateral 19 | 20 | TextRegionExchangeFormat.update_forward_refs() 21 | 22 | class V1MaskRefinementRequest(BaseModel) : 23 | method: str = 'fit_text' 24 | textlines: List[TextRegionExchangeFormat] 25 | 26 | @classmethod 27 | def __get_validators__(cls): 28 | yield cls.validate_to_json 29 | 30 | @classmethod 31 | def validate_to_json(cls, value): 32 | if isinstance(value, str): 33 | return cls(**json.loads(value)) 34 | return value 35 | 36 | class V1MaskRefinementResponse(BaseModel) : 37 | version: str 38 | 39 | @classmethod 40 | def __get_validators__(cls): 41 | yield cls.validate_to_json 42 | 43 | @classmethod 44 | def validate_to_json(cls, value): 45 | if isinstance(value, str): 46 | return cls(**json.loads(value)) 47 | return value 48 | -------------------------------------------------------------------------------- /services/mask_refinement_v1/text_mask_utils.py: 
-------------------------------------------------------------------------------- 1 | 2 | from typing import Tuple, List 3 | import numpy as np 4 | import cv2 5 | import math 6 | 7 | from tqdm import tqdm 8 | from sklearn.mixture import BayesianGaussianMixture 9 | from functools import reduce 10 | from collections import defaultdict 11 | from scipy.optimize import linear_sum_assignment 12 | 13 | COLOR_RANGE_SIGMA = 1.5 # how many stddev away is considered the same color 14 | 15 | def save_rgb(fn, img) : 16 | if len(img.shape) == 3 and img.shape[2] == 3 : 17 | cv2.imwrite(fn, cv2.cvtColor(img, cv2.COLOR_RGB2BGR)) 18 | else : 19 | cv2.imwrite(fn, img) 20 | 21 | def area(x1, y1, w1, h1, x2, y2, w2, h2): # returns None if rectangles don't intersect 22 | x_overlap = max(0, min(x1 + w1, x2 + w2) - max(x1, x2)) 23 | y_overlap = max(0, min(y1 + h1, y2 + h2) - max(y1, y2)) 24 | return x_overlap * y_overlap 25 | 26 | def dist(x1, y1, x2, y2) : 27 | return math.sqrt((x1 - x2) * (x1 - x2) + (y1 - y2) * (y1 - y2)) 28 | 29 | def rect_distance(x1, y1, x1b, y1b, x2, y2, x2b, y2b): 30 | left = x2b < x1 31 | right = x1b < x2 32 | bottom = y2b < y1 33 | top = y1b < y2 34 | if top and left: 35 | return dist(x1, y1b, x2b, y2) 36 | elif left and bottom: 37 | return dist(x1, y1, x2b, y2b) 38 | elif bottom and right: 39 | return dist(x1b, y1, x2, y2b) 40 | elif right and top: 41 | return dist(x1b, y1b, x2, y2) 42 | elif left: 43 | return x1 - x2b 44 | elif right: 45 | return x2 - x1b 46 | elif bottom: 47 | return y1 - y2b 48 | elif top: 49 | return y2 - y1b 50 | else: # rectangles intersect 51 | return 0 52 | 53 | def filter_masks(mask_img: np.ndarray, text_lines: List[Tuple[int, int, int, int]], keep_threshold = 1e-2) : 54 | mask_img = mask_img.copy() 55 | for (x, y, w, h) in text_lines : 56 | cv2.rectangle(mask_img, (x, y), (x + w, y + h), (0), 1) 57 | if len(text_lines) == 0 : 58 | return [], [] 59 | num_labels, labels, stats, centroids = cv2.connectedComponentsWithStats(mask_img) 60 | 
61 | cc2textline_assignment = [] 62 | result = [] 63 | M = len(text_lines) 64 | ratio_mat = np.zeros(shape = (num_labels, M), dtype = np.float32) 65 | dist_mat = np.zeros(shape = (num_labels, M), dtype = np.float32) 66 | for i in range(1, num_labels) : 67 | if stats[i, cv2.CC_STAT_AREA] <= 9 : 68 | continue # skip area too small 69 | cc = np.zeros_like(mask_img) 70 | cc[labels == i] = 255 71 | x1, y1, w1, h1 = cv2.boundingRect(cc) 72 | area1 = w1 * h1 73 | for j in range(M) : 74 | x2, y2, w2, h2 = text_lines[j] 75 | area2 = w2 * h2 76 | overlapping_area = area(x1, y1, w1, h1, x2, y2, w2, h2) 77 | ratio_mat[i, j] = overlapping_area / min(area1, area2) 78 | dist_mat[i, j] = rect_distance(x1, y1, x1 + w1, y1 + h1, x2, y2, x2 + w2, y2 + h2) 79 | j = np.argmax(ratio_mat[i]) 80 | unit = min([h1, w1, h2, w2]) 81 | if ratio_mat[i, j] > keep_threshold : 82 | cc2textline_assignment.append(j) 83 | result.append(np.copy(cc)) 84 | else : 85 | j = np.argmin(dist_mat[i]) 86 | if dist_mat[i, j] < 0.5 * unit : 87 | cc2textline_assignment.append(j) 88 | result.append(np.copy(cc)) 89 | else : 90 | # discard 91 | pass 92 | return result, cc2textline_assignment 93 | 94 | from pydensecrf.utils import compute_unary, unary_from_softmax 95 | import pydensecrf.densecrf as dcrf 96 | 97 | def refine_mask(rgbim, rawmask) : 98 | if len(rawmask.shape) == 2 : 99 | rawmask = rawmask[:, :, None] 100 | mask_softmax = np.concatenate([cv2.bitwise_not(rawmask)[:, :, None], rawmask], axis=2) 101 | mask_softmax = mask_softmax.astype(np.float32) / 255.0 102 | n_classes = 2 103 | feat_first = mask_softmax.transpose((2, 0, 1)).reshape((n_classes,-1)) 104 | unary = unary_from_softmax(feat_first) 105 | unary = np.ascontiguousarray(unary) 106 | 107 | d = dcrf.DenseCRF2D(rgbim.shape[1], rgbim.shape[0], n_classes) 108 | 109 | d.setUnaryEnergy(unary) 110 | d.addPairwiseGaussian(sxy=1, compat=3, kernel=dcrf.DIAG_KERNEL, 111 | normalization=dcrf.NO_NORMALIZATION) 112 | 113 | d.addPairwiseBilateral(sxy=23, srgb=7, 
rgbim=rgbim, 114 | compat=20, 115 | kernel=dcrf.DIAG_KERNEL, 116 | normalization=dcrf.NO_NORMALIZATION) 117 | Q = d.inference(5) 118 | res = np.argmax(Q, axis=0).reshape((rgbim.shape[0], rgbim.shape[1])) 119 | crf_mask = np.array(res * 255, dtype=np.uint8) 120 | return crf_mask 121 | 122 | def complete_mask_fill(img_np: np.ndarray, ccs: List[np.ndarray], text_lines: List[Tuple[int, int, int, int]], cc2textline_assignment) : 123 | if len(ccs) == 0 : 124 | return 125 | for (x, y, w, h) in text_lines : 126 | final_mask = cv2.rectangle(final_mask, (x, y), (x + w, y + h), (255), -1) 127 | return final_mask 128 | 129 | def complete_mask(img_np: np.ndarray, ccs: List[np.ndarray], text_lines: List[Tuple[int, int, int, int]], cc2textline_assignment) : 130 | if len(ccs) == 0 : 131 | return 132 | textline_ccs = [np.zeros_like(ccs[0]) for _ in range(len(text_lines))] 133 | for i, cc in enumerate(ccs) : 134 | txtline = cc2textline_assignment[i] 135 | textline_ccs[txtline] = cv2.bitwise_or(textline_ccs[txtline], cc) 136 | final_mask = np.zeros_like(ccs[0]) 137 | img_np = cv2.bilateralFilter(img_np, 17, 80, 80) 138 | for i, cc in enumerate(tqdm(textline_ccs)) : 139 | x1, y1, w1, h1 = cv2.boundingRect(cc) 140 | text_size = min(w1, h1) 141 | extend_size = int(text_size * 0.1) 142 | x1 = max(x1 - extend_size, 0) 143 | y1 = max(y1 - extend_size, 0) 144 | w1 += extend_size * 2 145 | h1 += extend_size * 2 146 | w1 = min(w1, img_np.shape[1] - x1 - 1) 147 | h1 = min(h1, img_np.shape[0] - y1 - 1) 148 | dilate_size = max((int(text_size * 0.3) // 2) * 2 + 1, 3) 149 | kern = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (dilate_size, dilate_size)) 150 | cc_region = np.ascontiguousarray(cc[y1: y1 + h1, x1: x1 + w1]) 151 | if cc_region.size == 0 : 152 | continue 153 | #cv2.imshow('cc before', image_resize(cc_region, width = 256)) 154 | img_region = np.ascontiguousarray(img_np[y1: y1 + h1, x1: x1 + w1]) 155 | #cv2.imshow('img', image_resize(img_region, width = 256)) 156 | cc_region = 
refine_mask(img_region, cc_region) 157 | #cv2.imshow('cc after', image_resize(cc_region, width = 256)) 158 | #cv2.waitKey(0) 159 | cc[y1: y1 + h1, x1: x1 + w1] = cc_region 160 | cc = cv2.dilate(cc, kern) 161 | final_mask = cv2.bitwise_or(final_mask, cc) 162 | kern = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (3, 3)) 163 | # for (x, y, w, h) in text_lines : 164 | # final_mask = cv2.rectangle(final_mask, (x, y), (x + w, y + h), (255), -1) 165 | return cv2.dilate(final_mask, kern) 166 | 167 | def unsharp(image) : 168 | gaussian_3 = cv2.GaussianBlur(image, (3, 3), 2.0) 169 | return cv2.addWeighted(image, 1.5, gaussian_3, -0.5, 0, image) 170 | 171 | from utils import Quadrilateral 172 | 173 | def run_refine_mask(raw_image: np.ndarray, raw_mask: np.ndarray, textlines: List[Quadrilateral], method: str = 'fit_text') -> Tuple[np.ndarray, str] : 174 | mask_resized = cv2.resize(raw_mask, (raw_image.shape[1] // 2, raw_image.shape[0] // 2), interpolation = cv2.INTER_LINEAR) 175 | img_resized_2 = cv2.resize(raw_image, (raw_image.shape[1] // 2, raw_image.shape[0] // 2), interpolation = cv2.INTER_LINEAR) 176 | mask_resized[mask_resized > 0] = 255 177 | text_lines = [(int(a.aabb.x // 2), int(a.aabb.y // 2), int(a.aabb.w // 2), int(a.aabb.h // 2)) for a in textlines] 178 | mask_ccs, cc2textline_assignment = filter_masks(mask_resized, text_lines) 179 | if mask_ccs : 180 | if method == 'fit_text' : 181 | final_mask = complete_mask(img_resized_2, mask_ccs, text_lines, cc2textline_assignment) 182 | else : 183 | final_mask = complete_mask_fill(img_resized_2, mask_ccs, text_lines, cc2textline_assignment) 184 | final_mask = cv2.resize(final_mask, (raw_image.shape[1], raw_image.shape[0]), interpolation = cv2.INTER_LINEAR) 185 | final_mask[final_mask > 0] = 255 186 | else : 187 | final_mask = np.zeros((raw_image.shape[0], raw_image.shape[1]), dtype = np.uint8) 188 | return final_mask, "mask-refine-20220423" 189 | 
-------------------------------------------------------------------------------- /services/models/Cargo.lock: -------------------------------------------------------------------------------- 1 | # This file is automatically @generated by Cargo. 2 | # It is not intended for manual editing. 3 | version = 3 4 | 5 | [[package]] 6 | name = "ahash" 7 | version = "0.7.6" 8 | source = "registry+https://github.com/rust-lang/crates.io-index" 9 | checksum = "fcb51a0695d8f838b1ee009b3fbf66bda078cd64590202a864a8f3e8c4315c47" 10 | dependencies = [ 11 | "getrandom", 12 | "once_cell", 13 | "version_check", 14 | ] 15 | 16 | [[package]] 17 | name = "autocfg" 18 | version = "1.1.0" 19 | source = "registry+https://github.com/rust-lang/crates.io-index" 20 | checksum = "d468802bab17cbc0cc575e9b053f41e72aa36bfa6b7f55e3529ffa43161b97fa" 21 | 22 | [[package]] 23 | name = "base64" 24 | version = "0.13.0" 25 | source = "registry+https://github.com/rust-lang/crates.io-index" 26 | checksum = "904dfeac50f3cdaba28fc6f57fdcddb75f49ed61346676a78c4ffe55877802fd" 27 | 28 | [[package]] 29 | name = "bson" 30 | version = "2.1.0" 31 | source = "registry+https://github.com/rust-lang/crates.io-index" 32 | checksum = "41539b5c502b7c4e7b8af8ef07e5c442fe79ceba62a2aad8e62bd589b9454745" 33 | dependencies = [ 34 | "ahash", 35 | "base64", 36 | "chrono", 37 | "hex", 38 | "indexmap", 39 | "lazy_static", 40 | "rand", 41 | "serde", 42 | "serde_bytes", 43 | "serde_json", 44 | "uuid", 45 | ] 46 | 47 | [[package]] 48 | name = "cfg-if" 49 | version = "1.0.0" 50 | source = "registry+https://github.com/rust-lang/crates.io-index" 51 | checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd" 52 | 53 | [[package]] 54 | name = "chrono" 55 | version = "0.4.19" 56 | source = "registry+https://github.com/rust-lang/crates.io-index" 57 | checksum = "670ad68c9088c2a963aaa298cb369688cf3f9465ce5e2d4ca10e6e0098a1ce73" 58 | dependencies = [ 59 | "num-integer", 60 | "num-traits", 61 | ] 62 | 63 | [[package]] 64 | 
name = "getrandom" 65 | version = "0.2.4" 66 | source = "registry+https://github.com/rust-lang/crates.io-index" 67 | checksum = "418d37c8b1d42553c93648be529cb70f920d3baf8ef469b74b9638df426e0b4c" 68 | dependencies = [ 69 | "cfg-if", 70 | "libc", 71 | "wasi", 72 | ] 73 | 74 | [[package]] 75 | name = "hashbrown" 76 | version = "0.11.2" 77 | source = "registry+https://github.com/rust-lang/crates.io-index" 78 | checksum = "ab5ef0d4909ef3724cc8cce6ccc8572c5c817592e9285f5464f8e86f8bd3726e" 79 | 80 | [[package]] 81 | name = "hex" 82 | version = "0.4.3" 83 | source = "registry+https://github.com/rust-lang/crates.io-index" 84 | checksum = "7f24254aa9a54b5c858eaee2f5bccdb46aaf0e486a595ed5fd8f86ba55232a70" 85 | 86 | [[package]] 87 | name = "indexmap" 88 | version = "1.8.0" 89 | source = "registry+https://github.com/rust-lang/crates.io-index" 90 | checksum = "282a6247722caba404c065016bbfa522806e51714c34f5dfc3e4a3a46fcb4223" 91 | dependencies = [ 92 | "autocfg", 93 | "hashbrown", 94 | ] 95 | 96 | [[package]] 97 | name = "itoa" 98 | version = "1.0.1" 99 | source = "registry+https://github.com/rust-lang/crates.io-index" 100 | checksum = "1aab8fc367588b89dcee83ab0fd66b72b50b72fa1904d7095045ace2b0c81c35" 101 | 102 | [[package]] 103 | name = "lazy_static" 104 | version = "1.4.0" 105 | source = "registry+https://github.com/rust-lang/crates.io-index" 106 | checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" 107 | 108 | [[package]] 109 | name = "libc" 110 | version = "0.2.119" 111 | source = "registry+https://github.com/rust-lang/crates.io-index" 112 | checksum = "1bf2e165bb3457c8e098ea76f3e3bc9db55f87aa90d52d0e6be741470916aaa4" 113 | 114 | [[package]] 115 | name = "models" 116 | version = "0.1.0" 117 | dependencies = [ 118 | "bson", 119 | ] 120 | 121 | [[package]] 122 | name = "num-integer" 123 | version = "0.1.44" 124 | source = "registry+https://github.com/rust-lang/crates.io-index" 125 | checksum = 
"d2cc698a63b549a70bc047073d2949cce27cd1c7b0a4a862d08a8031bc2801db" 126 | dependencies = [ 127 | "autocfg", 128 | "num-traits", 129 | ] 130 | 131 | [[package]] 132 | name = "num-traits" 133 | version = "0.2.14" 134 | source = "registry+https://github.com/rust-lang/crates.io-index" 135 | checksum = "9a64b1ec5cda2586e284722486d802acf1f7dbdc623e2bfc57e65ca1cd099290" 136 | dependencies = [ 137 | "autocfg", 138 | ] 139 | 140 | [[package]] 141 | name = "once_cell" 142 | version = "1.9.0" 143 | source = "registry+https://github.com/rust-lang/crates.io-index" 144 | checksum = "da32515d9f6e6e489d7bc9d84c71b060db7247dc035bbe44eac88cf87486d8d5" 145 | 146 | [[package]] 147 | name = "ppv-lite86" 148 | version = "0.2.16" 149 | source = "registry+https://github.com/rust-lang/crates.io-index" 150 | checksum = "eb9f9e6e233e5c4a35559a617bf40a4ec447db2e84c20b55a6f83167b7e57872" 151 | 152 | [[package]] 153 | name = "proc-macro2" 154 | version = "1.0.36" 155 | source = "registry+https://github.com/rust-lang/crates.io-index" 156 | checksum = "c7342d5883fbccae1cc37a2353b09c87c9b0f3afd73f5fb9bba687a1f733b029" 157 | dependencies = [ 158 | "unicode-xid", 159 | ] 160 | 161 | [[package]] 162 | name = "quote" 163 | version = "1.0.15" 164 | source = "registry+https://github.com/rust-lang/crates.io-index" 165 | checksum = "864d3e96a899863136fc6e99f3d7cae289dafe43bf2c5ac19b70df7210c0a145" 166 | dependencies = [ 167 | "proc-macro2", 168 | ] 169 | 170 | [[package]] 171 | name = "rand" 172 | version = "0.8.5" 173 | source = "registry+https://github.com/rust-lang/crates.io-index" 174 | checksum = "34af8d1a0e25924bc5b7c43c079c942339d8f0a8b57c39049bef581b46327404" 175 | dependencies = [ 176 | "libc", 177 | "rand_chacha", 178 | "rand_core", 179 | ] 180 | 181 | [[package]] 182 | name = "rand_chacha" 183 | version = "0.3.1" 184 | source = "registry+https://github.com/rust-lang/crates.io-index" 185 | checksum = "e6c10a63a0fa32252be49d21e7709d4d4baf8d231c2dbce1eaa8141b9b127d88" 186 | dependencies = [ 187 | 
"ppv-lite86", 188 | "rand_core", 189 | ] 190 | 191 | [[package]] 192 | name = "rand_core" 193 | version = "0.6.3" 194 | source = "registry+https://github.com/rust-lang/crates.io-index" 195 | checksum = "d34f1408f55294453790c48b2f1ebbb1c5b4b7563eb1f418bcfcfdbb06ebb4e7" 196 | dependencies = [ 197 | "getrandom", 198 | ] 199 | 200 | [[package]] 201 | name = "ryu" 202 | version = "1.0.9" 203 | source = "registry+https://github.com/rust-lang/crates.io-index" 204 | checksum = "73b4b750c782965c211b42f022f59af1fbceabdd026623714f104152f1ec149f" 205 | 206 | [[package]] 207 | name = "serde" 208 | version = "1.0.136" 209 | source = "registry+https://github.com/rust-lang/crates.io-index" 210 | checksum = "ce31e24b01e1e524df96f1c2fdd054405f8d7376249a5110886fb4b658484789" 211 | dependencies = [ 212 | "serde_derive", 213 | ] 214 | 215 | [[package]] 216 | name = "serde_bytes" 217 | version = "0.11.5" 218 | source = "registry+https://github.com/rust-lang/crates.io-index" 219 | checksum = "16ae07dd2f88a366f15bd0632ba725227018c69a1c8550a927324f8eb8368bb9" 220 | dependencies = [ 221 | "serde", 222 | ] 223 | 224 | [[package]] 225 | name = "serde_derive" 226 | version = "1.0.136" 227 | source = "registry+https://github.com/rust-lang/crates.io-index" 228 | checksum = "08597e7152fcd306f41838ed3e37be9eaeed2b61c42e2117266a554fab4662f9" 229 | dependencies = [ 230 | "proc-macro2", 231 | "quote", 232 | "syn", 233 | ] 234 | 235 | [[package]] 236 | name = "serde_json" 237 | version = "1.0.79" 238 | source = "registry+https://github.com/rust-lang/crates.io-index" 239 | checksum = "8e8d9fa5c3b304765ce1fd9c4c8a3de2c8db365a5b91be52f186efc675681d95" 240 | dependencies = [ 241 | "indexmap", 242 | "itoa", 243 | "ryu", 244 | "serde", 245 | ] 246 | 247 | [[package]] 248 | name = "syn" 249 | version = "1.0.86" 250 | source = "registry+https://github.com/rust-lang/crates.io-index" 251 | checksum = "8a65b3f4ffa0092e9887669db0eae07941f023991ab58ea44da8fe8e2d511c6b" 252 | dependencies = [ 253 | "proc-macro2", 
254 | "quote", 255 | "unicode-xid", 256 | ] 257 | 258 | [[package]] 259 | name = "unicode-xid" 260 | version = "0.2.2" 261 | source = "registry+https://github.com/rust-lang/crates.io-index" 262 | checksum = "8ccb82d61f80a663efe1f787a51b16b5a51e3314d6ac365b08639f52387b33f3" 263 | 264 | [[package]] 265 | name = "uuid" 266 | version = "0.8.2" 267 | source = "registry+https://github.com/rust-lang/crates.io-index" 268 | checksum = "bc5cf98d8186244414c848017f0e2676b3fcb46807f6668a97dfe67359a3c4b7" 269 | dependencies = [ 270 | "getrandom", 271 | "serde", 272 | ] 273 | 274 | [[package]] 275 | name = "version_check" 276 | version = "0.9.4" 277 | source = "registry+https://github.com/rust-lang/crates.io-index" 278 | checksum = "49874b5167b65d7193b8aba1567f5c7d93d001cafc34600cee003eda787e483f" 279 | 280 | [[package]] 281 | name = "wasi" 282 | version = "0.10.2+wasi-snapshot-preview1" 283 | source = "registry+https://github.com/rust-lang/crates.io-index" 284 | checksum = "fd6fbd9a79829dd1ad0cc20627bf1ed606756a7f77edff7b66b7064f9cb327c6" 285 | -------------------------------------------------------------------------------- /services/models/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "models" 3 | version = "0.1.0" 4 | edition = "2021" 5 | 6 | # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html 7 | 8 | [dependencies] 9 | bson = "2.0.1" 10 | -------------------------------------------------------------------------------- /services/models/src/lib.rs: -------------------------------------------------------------------------------- 1 | use std::collections::HashSet; 2 | 3 | use bson::oid::ObjectId; 4 | 5 | 6 | pub struct ImageSource { 7 | /// Canonicalized raw URL of source image (e.g. twitter CDN url) 8 | pub source_url: Option, 9 | /// Canonicalized URL of web page for this image (e.g. 
twitter url) 10 | pub source_page: Option, 11 | /// When is the image created, this is provided by its source website, fill this field whenever possible 12 | pub created_at: Option, 13 | /// When is the image uploaded to cotrans 14 | pub uploaded_at: bson::DateTime, 15 | /// Who uploaded this image to cotrans 16 | pub uploaded_by: String, 17 | } 18 | 19 | pub struct OriginalImage { 20 | /// Sources of this image 21 | /// Use vec in case of same image being reposted at multiple websites 22 | pub sources: Vec, 23 | /// Highest width of this image, there maybe multiple version of the same image exist 24 | /// we only keep the one with highest resolution 25 | pub width: u32, 26 | /// Highest height of this image, there maybe multiple version of the same image exist 27 | /// we only keep the one with highest resolution 28 | pub height: u32, 29 | /// File size in octets of the best version of this image 30 | pub file_size: u64, 31 | /// Format of this image (e.g. JPEG, PNG, WEBM) 32 | pub image_format: Option, 33 | /// Number of channels in this image (e.g. 
1 for grayscale, 3 for RGB, 4 for RGBA) 34 | pub channels: u32, 35 | /// When is image with this phash value first uploaded to cotrans 36 | pub created_at: bson::DateTime, 37 | /// Who is the first one uploaded image with this phash value to cotrans 38 | pub created_by: String, 39 | 40 | /// Perceptual hash value of this image 41 | pub phash_value: String, 42 | /// Blockhash value of this image (optional) 43 | pub blockhash_value: Option, 44 | /// Wavelet hash value of this image (optional) 45 | pub whash_value: Option, 46 | 47 | /// Link to cotrans' store of this image, likely a Cloudflare image link 48 | pub url: String, 49 | /// Optional backup links to this image 50 | pub backup_urls: Option>, 51 | /// SHA256 hash of this image 52 | pub sha256_value: String 53 | } 54 | 55 | /// For flexibility, result does not have a fixed form 56 | pub enum FreeFormResult { 57 | JSON(String), 58 | XML(String) 59 | } 60 | 61 | pub struct TextExtractionResult { 62 | /// Link to mask generated 63 | pub mask_url: String, 64 | 65 | /// Format of result 66 | pub format: String, 67 | /// Extracted text 68 | pub result: FreeFormResult 69 | } 70 | 71 | /// Record of a automatic text extraction operation, incldues both metadata and result 72 | pub struct TextExtraction { 73 | /// Which image is this record for 74 | pub phash_value: String, 75 | /// When is this text extraction request made 76 | pub created_at: bson::DateTime, 77 | /// Who made this text extraction request 78 | pub created_by: String, 79 | /// How long did this request take to finish 80 | pub time_used_ms: u32, 81 | /// Log 82 | pub log: Option, 83 | 84 | /// Name and version of detector (e.g. `DBNet-RN101-v20210711`) 85 | pub detector: String, 86 | /// Name and version of OCR (e.g. 
`OCR-AR-48px-v20210921`) 87 | pub ocr: String, 88 | 89 | /// Height of image sent to detector 90 | pub detection_height: u32, 91 | /// Width of image sent to detector 92 | pub detection_width: u32, 93 | 94 | /// Extraction result 95 | pub result: TextExtractionResult 96 | } 97 | 98 | pub struct Inpainting { 99 | /// Inpainting model name and version (e.g. `LaMa-v20220220`) 100 | pub model: String, 101 | /// Link to inpainted image 102 | pub inpainted_url: String, 103 | /// Link to mask used during inpainting 104 | pub mask: String, 105 | /// Width of image used for inpainting 106 | pub width: u32, 107 | /// Height of image used for inpainting 108 | pub height: u32, 109 | /// Blending method used, one of `replace`, `poisson`, `cutout` 110 | pub blending: String 111 | } 112 | 113 | pub struct Typesetting { 114 | 115 | } 116 | 117 | pub struct TextRendering { 118 | 119 | } 120 | 121 | 122 | pub struct Translation { 123 | /// Which image is this record for 124 | pub phash_value: String, 125 | /// Which extraction result is this record based on 126 | pub extraction_id: Option, 127 | /// Which translation result is this record based on 128 | pub translation_id: Option, 129 | /// When is this translation created 130 | pub created_at: bson::DateTime, 131 | /// Who made this translation 132 | pub created_by: CreatedBy, 133 | 134 | /// Info related to inpaitning, empty if user did his own typesetting 135 | pub inpainting: Option, 136 | /// Info related typesetting 137 | pub typesetting: Option, 138 | /// Info related text rendering 139 | pub text_rendering: Option, 140 | 141 | /// Format of result 142 | pub format: String, 143 | /// Result 144 | pub result: FreeFormResult, 145 | /// Final image 146 | pub final_url: String, 147 | pub width: u32, 148 | pub height: u32, 149 | pub file_size: u64, 150 | /// Backup links to this image 151 | pub backup_urls: Option>, 152 | pub sha256_value: String, 153 | 154 | /// Upvotes 155 | pub upvotes: u32, 156 | /// Downvotes 157 | pub 
downvotes: u32, 158 | /// Score 159 | pub score: u32 160 | } 161 | 162 | pub struct User { 163 | pub created_at: bson::DateTime, 164 | pub password_hashed: Option 165 | } 166 | 167 | pub struct MachineTranslator { 168 | pub name: String, 169 | pub version: String 170 | } 171 | 172 | pub enum CreatedBy { 173 | User(ObjectId), 174 | Machine(MachineTranslator) 175 | } 176 | 177 | #[cfg(test)] 178 | mod tests { 179 | #[test] 180 | fn it_works() { 181 | let result = 2 + 2; 182 | assert_eq!(result, 4); 183 | } 184 | } 185 | -------------------------------------------------------------------------------- /services/ocr_ctc_v1/main.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Any 3 | from models import * 4 | from ocr import load_model, run_ocr 5 | 6 | import numpy as np 7 | from PIL import Image 8 | import io 9 | import cv2 10 | import secrets 11 | 12 | from fastapi import FastAPI, Form, File, UploadFile, Response 13 | from fastapi.responses import JSONResponse 14 | 15 | from utils import Quadrilateral 16 | 17 | app = FastAPI() 18 | 19 | class JsonAndImageResponse(Response) : 20 | def render(self, content: Any) -> bytes: 21 | boundary = secrets.token_bytes(16).hex() 22 | json_data: dict = content["json"] 23 | img_data: Image.Image = content["img"] 24 | img_type: str = content["img-type"] 25 | self.media_type = f"multipart/related; boundary={boundary}; start=\"jsonData\";" 26 | json_content = json.dumps(json_data) 27 | ans = io.BytesIO() 28 | ans.write(f"--{boundary}\r\n".encode('utf-8')) 29 | ans.write(b"Content-Type: application/json\r\nContent-ID: jsonData\r\n\r\n") 30 | ans.write(json_content.encode('utf-8')) 31 | ans.write(f"\r\n--{boundary}\r\n".encode('utf-8')) 32 | ans.write(f"Content-Type: image/{img_type}\r\nContent-ID: imageData\r\n\r\n".encode('utf-8')) 33 | img_data.save(ans, format = 'PNG') 34 | ans.write(f"\r\n--{boundary}--".encode('utf-8')) 35 | return ans.getvalue() 36 | 37 | def 
def get_bbox(tref: 'TextRegionExchangeFormat', w: int, h: int) :
    """Convert a TextRegionExchangeFormat region into a bounding-box object.

    Args:
        tref: region whose `fmt` field selects the conversion
            ('quad' or 'textbox').
        w: image width in pixels, used to denormalize coordinates.
        h: image height in pixels, used to denormalize coordinates.

    Returns:
        A Quadrilateral for 'quad' regions; None for any unrecognized fmt
        (falls through, preserving the original behavior).

    Raises:
        NotImplementedError: for the not-yet-supported 'textbox' format.
    """
    if tref.fmt == 'quad' :
        return Quadrilateral.from_tref(tref, w, h)
    elif tref.fmt == 'textbox' :
        # BUG FIX: `raise NotImplemented` raises TypeError in Python 3
        # because NotImplemented is a constant, not an exception class;
        # NotImplementedError is the intended exception.
        raise NotImplementedError('textbox regions are not supported yet')
List[TextRegionExchangeFormat] 38 | version: str 39 | 40 | @classmethod 41 | def __get_validators__(cls): 42 | yield cls.validate_to_json 43 | 44 | @classmethod 45 | def validate_to_json(cls, value): 46 | if isinstance(value, str): 47 | return cls(**json.loads(value)) 48 | return value 49 | -------------------------------------------------------------------------------- /services/phash/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "phash" 3 | version = "0.1.0" 4 | edition = "2021" 5 | 6 | # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html 7 | 8 | [dependencies] 9 | image = "0.23.14" 10 | img_hash = "3.2.0" 11 | hex = "0.4.3" 12 | -------------------------------------------------------------------------------- /services/phash/src/main.rs: -------------------------------------------------------------------------------- 1 | fn main() { 2 | println!("Hello, world!"); 3 | } 4 | -------------------------------------------------------------------------------- /services/text_detection_v1/dbnet_utils.py: -------------------------------------------------------------------------------- 1 | 2 | import pyclipper 3 | import cv2 4 | import numpy as np 5 | from shapely.geometry import Polygon 6 | 7 | class SegDetectorRepresenter(): 8 | def __init__(self, thresh=0.6, box_thresh=0.8, max_candidates=1000, unclip_ratio=2.2): 9 | self.min_size = 3 10 | self.thresh = thresh 11 | self.box_thresh = box_thresh 12 | self.max_candidates = max_candidates 13 | self.unclip_ratio = unclip_ratio 14 | 15 | def __call__(self, batch, pred, is_output_polygon=False): 16 | ''' 17 | batch: (image, polygons, ignore_tags 18 | batch: a dict produced by dataloaders. 19 | image: tensor of shape (N, C, H, W). 20 | polygons: tensor of shape (N, K, 4, 2), the polygons of objective regions. 21 | ignore_tags: tensor of shape (N, K), indicates whether a region is ignorable or not. 
22 | shape: the original shape of images. 23 | filename: the original filenames of images. 24 | pred: 25 | binary: text region segmentation map, with shape (N, H, W) 26 | thresh: [if exists] thresh hold prediction with shape (N, H, W) 27 | thresh_binary: [if exists] binarized with threshhold, (N, H, W) 28 | ''' 29 | pred = pred[:, 0, :, :] 30 | segmentation = self.binarize(pred) 31 | boxes_batch = [] 32 | scores_batch = [] 33 | for batch_index in range(pred.size(0)): 34 | height, width = batch['shape'][batch_index] 35 | if is_output_polygon: 36 | boxes, scores = self.polygons_from_bitmap(pred[batch_index], segmentation[batch_index], width, height) 37 | else: 38 | boxes, scores = self.boxes_from_bitmap(pred[batch_index], segmentation[batch_index], width, height) 39 | boxes_batch.append(boxes) 40 | scores_batch.append(scores) 41 | return boxes_batch, scores_batch 42 | 43 | def binarize(self, pred): 44 | return pred > self.thresh 45 | 46 | def polygons_from_bitmap(self, pred, _bitmap, dest_width, dest_height): 47 | ''' 48 | _bitmap: single map with shape (H, W), 49 | whose values are binarized as {0, 1} 50 | ''' 51 | 52 | assert len(_bitmap.shape) == 2 53 | bitmap = _bitmap.cpu().numpy() # The first channel 54 | pred = pred.cpu().detach().numpy() 55 | height, width = bitmap.shape 56 | boxes = [] 57 | scores = [] 58 | 59 | contours, _ = cv2.findContours((bitmap * 255).astype(np.uint8), cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE) 60 | 61 | for contour in contours[:self.max_candidates]: 62 | epsilon = 0.005 * cv2.arcLength(contour, True) 63 | approx = cv2.approxPolyDP(contour, epsilon, True) 64 | points = approx.reshape((-1, 2)) 65 | if points.shape[0] < 4: 66 | continue 67 | # _, sside = self.get_mini_boxes(contour) 68 | # if sside < self.min_size: 69 | # continue 70 | score = self.box_score_fast(pred, contour.squeeze(1)) 71 | if self.box_thresh > score: 72 | continue 73 | 74 | if points.shape[0] > 2: 75 | box = self.unclip(points, unclip_ratio=self.unclip_ratio) 76 | if 
len(box) > 1: 77 | continue 78 | else: 79 | continue 80 | box = box.reshape(-1, 2) 81 | _, sside = self.get_mini_boxes(box.reshape((-1, 1, 2))) 82 | if sside < self.min_size + 2: 83 | continue 84 | 85 | if not isinstance(dest_width, int): 86 | dest_width = dest_width.item() 87 | dest_height = dest_height.item() 88 | 89 | box[:, 0] = np.clip(np.round(box[:, 0] / width * dest_width), 0, dest_width) 90 | box[:, 1] = np.clip(np.round(box[:, 1] / height * dest_height), 0, dest_height) 91 | boxes.append(box) 92 | scores.append(score) 93 | return boxes, scores 94 | 95 | def boxes_from_bitmap(self, pred, _bitmap, dest_width, dest_height): 96 | ''' 97 | _bitmap: single map with shape (H, W), 98 | whose values are binarized as {0, 1} 99 | ''' 100 | 101 | assert len(_bitmap.shape) == 2 102 | bitmap = _bitmap.cpu().numpy() # The first channel 103 | pred = pred.cpu().detach().numpy() 104 | height, width = bitmap.shape 105 | try : 106 | contours, _ = cv2.findContours((bitmap * 255).astype(np.uint8), cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE) 107 | except ValueError : 108 | return [], [] 109 | num_contours = min(len(contours), self.max_candidates) 110 | boxes = np.zeros((num_contours, 4, 2), dtype=np.int16) 111 | scores = np.zeros((num_contours,), dtype=np.float32) 112 | 113 | for index in range(num_contours): 114 | contour = contours[index].squeeze(1) 115 | points, sside = self.get_mini_boxes(contour) 116 | if sside < self.min_size: 117 | continue 118 | points = np.array(points) 119 | score = self.box_score_fast(pred, contour) 120 | if self.box_thresh > score: 121 | continue 122 | 123 | box = self.unclip(points, unclip_ratio=self.unclip_ratio).reshape(-1, 1, 2) 124 | box, sside = self.get_mini_boxes(box) 125 | if sside < self.min_size + 2: 126 | continue 127 | box = np.array(box) 128 | if not isinstance(dest_width, int): 129 | dest_width = dest_width.item() 130 | dest_height = dest_height.item() 131 | 132 | box[:, 0] = np.clip(np.round(box[:, 0] / width * dest_width), 0, 
dest_width) 133 | box[:, 1] = np.clip(np.round(box[:, 1] / height * dest_height), 0, dest_height) 134 | startidx = box.sum(axis=1).argmin() 135 | box = np.roll(box, 4-startidx, 0) 136 | box = np.array(box) 137 | boxes[index, :, :] = box.astype(np.int16) 138 | scores[index] = score 139 | return boxes, scores 140 | 141 | def unclip(self, box, unclip_ratio=1.8): 142 | poly = Polygon(box) 143 | distance = poly.area * unclip_ratio / poly.length 144 | offset = pyclipper.PyclipperOffset() 145 | offset.AddPath(box, pyclipper.JT_ROUND, pyclipper.ET_CLOSEDPOLYGON) 146 | expanded = np.array(offset.Execute(distance)) 147 | return expanded 148 | 149 | def get_mini_boxes(self, contour): 150 | bounding_box = cv2.minAreaRect(contour) 151 | points = sorted(list(cv2.boxPoints(bounding_box)), key=lambda x: x[0]) 152 | 153 | index_1, index_2, index_3, index_4 = 0, 1, 2, 3 154 | if points[1][1] > points[0][1]: 155 | index_1 = 0 156 | index_4 = 1 157 | else: 158 | index_1 = 1 159 | index_4 = 0 160 | if points[3][1] > points[2][1]: 161 | index_2 = 2 162 | index_3 = 3 163 | else: 164 | index_2 = 3 165 | index_3 = 2 166 | 167 | box = [points[index_1], points[index_2], points[index_3], points[index_4]] 168 | return box, min(bounding_box[1]) 169 | 170 | def box_score_fast(self, bitmap, _box): 171 | h, w = bitmap.shape[:2] 172 | box = _box.copy() 173 | xmin = np.clip(np.floor(box[:, 0].min()).astype(np.int32), 0, w - 1) 174 | xmax = np.clip(np.ceil(box[:, 0].max()).astype(np.int32), 0, w - 1) 175 | ymin = np.clip(np.floor(box[:, 1].min()).astype(np.int32), 0, h - 1) 176 | ymax = np.clip(np.ceil(box[:, 1].max()).astype(np.int32), 0, h - 1) 177 | 178 | mask = np.zeros((ymax - ymin + 1, xmax - xmin + 1), dtype=np.uint8) 179 | box[:, 0] = box[:, 0] - xmin 180 | box[:, 1] = box[:, 1] - ymin 181 | cv2.fillPoly(mask, box.reshape(1, -1, 2).astype(np.int32), 1) 182 | return cv2.mean(bitmap[ymin:ymax + 1, xmin:xmax + 1], mask)[0] 183 | 
-------------------------------------------------------------------------------- /services/text_detection_v1/main.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Any 3 | from models import * 4 | from detector import load_model, run_detection 5 | 6 | import numpy as np 7 | from PIL import Image 8 | import io 9 | import cv2 10 | import secrets 11 | 12 | from fastapi import FastAPI, Form, File, UploadFile, Response 13 | app = FastAPI() 14 | 15 | class JsonAndImageResponse(Response) : 16 | def render(self, content: Any) -> bytes: 17 | boundary = secrets.token_bytes(16).hex() 18 | json_data: dict = content["json"] 19 | img_data: Image.Image = content["img"] 20 | img_type: str = content["img-type"] 21 | self.media_type = f"multipart/related; boundary={boundary}; start=\"jsonData\";" 22 | json_content = json.dumps(json_data) 23 | ans = io.BytesIO() 24 | ans.write(f"--{boundary}\r\n".encode('utf-8')) 25 | ans.write(b"Content-Type: application/json\r\nContent-ID: jsonData\r\n\r\n") 26 | ans.write(json_content.encode('utf-8')) 27 | ans.write(f"\r\n--{boundary}\r\n".encode('utf-8')) 28 | ans.write(f"Content-Type: image/{img_type}\r\nContent-ID: imageData\r\n\r\n".encode('utf-8')) 29 | img_data.save(ans, format = 'PNG') 30 | ans.write(f"\r\n--{boundary}--".encode('utf-8')) 31 | return ans.getvalue() 32 | 33 | class NparrayAndImageResponse(Response) : 34 | def render(self, content: Any) -> bytes: 35 | boundary = secrets.token_bytes(16).hex() 36 | np_data: np.ndarray = content["array"] 37 | img_data: Image.Image = content["img"] 38 | img_type: str = content["img-type"] 39 | self.media_type = f"multipart/related; boundary={boundary}; start=\"npData\";" 40 | ans = io.BytesIO() 41 | ans.write(f"--{boundary}\r\n".encode('utf-8')) 42 | ans.write(b"Content-Type: application/vnd.voilelabs.nparray\r\nContent-ID: npData\r\n\r\n") 43 | np.save(ans, np_data) 44 | ans.write(f"\r\n--{boundary}\r\n".encode('utf-8')) 45 | 
class JsonAndNparrayAndImageResponse(Response) :
    """multipart/related response carrying a JSON part, an npy-serialized
    numpy array part and a PNG image part, separated by a random boundary."""
    def render(self, content: Any) -> bytes:
        boundary = secrets.token_bytes(16).hex()
        json_data: dict = content["json"]
        np_data: np.ndarray = content["array"]
        img_data: Image.Image = content["img"]
        img_type: str = content["img-type"]
        self.media_type = f"multipart/related; boundary={boundary}; start=\"jsonData\";"
        ans = io.BytesIO()
        json_content = json.dumps(json_data)
        ans.write(f"--{boundary}\r\n".encode('utf-8'))
        ans.write(b"Content-Type: application/json\r\nContent-ID: jsonData\r\n\r\n")
        ans.write(json_content.encode('utf-8'))
        # BUG FIX: the JSON body part must be terminated by CRLF before the
        # next boundary delimiter (as the sibling JsonAndImageResponse and
        # NparrayAndImageResponse classes do); without the leading "\r\n" the
        # boundary is glued onto the JSON payload and the multipart body is
        # malformed.
        ans.write(f"\r\n--{boundary}\r\n".encode('utf-8'))
        ans.write(b"Content-Type: application/vnd.voilelabs.nparray\r\nContent-ID: npData\r\n\r\n")
        np.save(ans, np_data)
        ans.write(f"\r\n--{boundary}\r\n".encode('utf-8'))
        ans.write(f"Content-Type: image/{img_type}\r\nContent-ID: imageData\r\n\r\n".encode('utf-8'))
        # NOTE(review): the image is always serialized as PNG regardless of
        # img_type — confirm callers always pass "png".
        img_data.save(ans, format = 'PNG')
        ans.write(f"\r\n--{boundary}--".encode('utf-8'))
        return ans.getvalue()
-------------------------------------------------------------------------------- 1 | 2 | from __future__ import annotations 3 | from typing import List, Optional, Tuple 4 | from pydantic import BaseModel 5 | 6 | import json 7 | 8 | class TextRegionExchangeFormat(BaseModel) : 9 | fmt: str 10 | coords: str 11 | fg: Optional[Tuple[int, int, int]] 12 | bg: Optional[Tuple[int, int, int]] 13 | text: Optional[str] 14 | prob: Optional[float] = 0 15 | direction: Optional[str] 16 | lines: List[TextRegionExchangeFormat] = [] 17 | 18 | TextRegionExchangeFormat.update_forward_refs() 19 | 20 | class V1TextDetectionRequest(BaseModel): 21 | text_threshold: float = 0.5 22 | box_threshold: float = 0.7 23 | area_threshold: float = 16 24 | unclip_ratio: float = 2.3 25 | cuda: bool = False 26 | blur: bool = True 27 | blur_ks: int = 17 28 | blur_sigma_color: int = 80 29 | blur_sigma_space: int = 80 30 | target_ratio: float 31 | pad_width: int 32 | pad_height: int 33 | width: int # original image width 34 | height: int # original image height 35 | 36 | @classmethod 37 | def __get_validators__(cls): 38 | yield cls.validate_to_json 39 | 40 | @classmethod 41 | def validate_to_json(cls, value): 42 | if isinstance(value, str): 43 | return cls(**json.loads(value)) 44 | return value 45 | 46 | 47 | class V1TextDetectionResponse(BaseModel) : 48 | regions: List[TextRegionExchangeFormat] 49 | version: str 50 | 51 | @classmethod 52 | def __get_validators__(cls): 53 | yield cls.validate_to_json 54 | 55 | @classmethod 56 | def validate_to_json(cls, value): 57 | if isinstance(value, str): 58 | return cls(**json.loads(value)) 59 | return value 60 | 61 | -------------------------------------------------------------------------------- /services/textline_merge_v1/main.py: -------------------------------------------------------------------------------- 1 | 2 | from typing import Any 3 | from models import * 4 | from textline_merge import run_merge 5 | 6 | import numpy as np 7 | from PIL import Image 8 | 
import io 9 | import cv2 10 | import secrets 11 | 12 | from fastapi import FastAPI, Body 13 | from fastapi.responses import JSONResponse 14 | app = FastAPI() 15 | 16 | @app.post("/v1/merge") 17 | async def merge(config: V1TextlineMergeRequest) : 18 | if isinstance(config, dict) : 19 | config = V1TextlineMergeRequest.parse_obj(config) 20 | textlines = [Quadrilateral.from_tref(t, config.width, config.height) for t in config.textlines] 21 | regions, version = run_merge(config, textlines, config.width, config.height) 22 | resp = V1TextlineMergeResponse(regions = [r.to_tref_and_normalize(config.width, config.height) for r in regions], version = version) 23 | return JSONResponse(resp.dict(exclude_none = True)) 24 | -------------------------------------------------------------------------------- /services/textline_merge_v1/models.py: -------------------------------------------------------------------------------- 1 | 2 | from __future__ import annotations 3 | from typing import List, Optional, Tuple 4 | from pydantic import BaseModel 5 | 6 | import json 7 | 8 | class TextRegionExchangeFormat(BaseModel) : 9 | fmt: str 10 | coords: str 11 | fg: Optional[Tuple[int, int, int]] 12 | bg: Optional[Tuple[int, int, int]] 13 | text: Optional[str] 14 | prob: Optional[float] = 0 15 | direction: Optional[str] 16 | lines: List[TextRegionExchangeFormat] = [] 17 | 18 | from utils import Quadrilateral 19 | 20 | TextRegionExchangeFormat.update_forward_refs() 21 | 22 | class V1TextlineMergeRequest(BaseModel) : 23 | gamma: float = 0.5 24 | sigma: float = 2 25 | std_threshold: float = 6 26 | width: int 27 | height: int 28 | textlines: List[TextRegionExchangeFormat] 29 | 30 | @classmethod 31 | def __get_validators__(cls): 32 | yield cls.validate_to_json 33 | 34 | @classmethod 35 | def validate_to_json(cls, value): 36 | if isinstance(value, str): 37 | return cls(**json.loads(value)) 38 | return value 39 | 40 | class V1TextlineMergeResponse(BaseModel) : 41 | version: str 42 | regions: 
List[TextRegionExchangeFormat] 43 | 44 | @classmethod 45 | def __get_validators__(cls): 46 | yield cls.validate_to_json 47 | 48 | @classmethod 49 | def validate_to_json(cls, value): 50 | if isinstance(value, str): 51 | return cls(**json.loads(value)) 52 | return value 53 | -------------------------------------------------------------------------------- /services/textline_merge_v1/textline_merge.py: -------------------------------------------------------------------------------- 1 | 2 | from collections import Counter 3 | import itertools 4 | from typing import List, Set, Tuple 5 | import unicodedata 6 | 7 | import cv2 8 | from utils import Quadrilateral, quadrilateral_can_merge_region_coarse 9 | import numpy as np 10 | import networkx as nx 11 | 12 | def _is_whitespace(ch): 13 | """Checks whether `chars` is a whitespace character.""" 14 | # \t, \n, and \r are technically contorl characters but we treat them 15 | # as whitespace since they are generally considered as such. 16 | if ch == " " or ch == "\t" or ch == "\n" or ch == "\r" or ord(ch) == 0: 17 | return True 18 | cat = unicodedata.category(ch) 19 | if cat == "Zs": 20 | return True 21 | return False 22 | 23 | 24 | def _is_control(ch): 25 | """Checks whether `chars` is a control character.""" 26 | """Checks whether `chars` is a whitespace character.""" 27 | # These are technically control characters but we count them as whitespace 28 | # characters. 29 | if ch == "\t" or ch == "\n" or ch == "\r": 30 | return False 31 | cat = unicodedata.category(ch) 32 | if cat in ("Cc", "Cf"): 33 | return True 34 | return False 35 | 36 | 37 | def _is_punctuation(ch): 38 | """Checks whether `chars` is a punctuation character.""" 39 | """Checks whether `chars` is a whitespace character.""" 40 | cp = ord(ch) 41 | # We treat all non-letter/number ASCII as punctuation. 42 | # Characters such as "^", "$", and "`" are not in the Unicode 43 | # Punctuation class but we treat them as punctuation anyways, for 44 | # consistency. 
45 | if ((cp >= 33 and cp <= 47) or (cp >= 58 and cp <= 64) or 46 | (cp >= 91 and cp <= 96) or (cp >= 123 and cp <= 126)): 47 | return True 48 | cat = unicodedata.category(ch) 49 | if cat.startswith("P"): 50 | return True 51 | return False 52 | 53 | def split_text_region(bboxes: List[Quadrilateral], region_indices: Set[int], gamma = 0.5, sigma = 2, std_threshold = 6.0) -> List[Set[int]] : 54 | region_indices = list(region_indices) 55 | if len(region_indices) == 1 : 56 | # case #1 57 | return [set(region_indices)] 58 | if len(region_indices) == 2 : 59 | # case #2 60 | fs1 = bboxes[region_indices[0]].font_size 61 | fs2 = bboxes[region_indices[1]].font_size 62 | fs = max(fs1, fs2) 63 | if bboxes[region_indices[0]].distance(bboxes[region_indices[1]]) < (1 + gamma) * fs \ 64 | and abs(bboxes[region_indices[0]].angle - bboxes[region_indices[1]].angle) < 4 * np.pi / 180 : 65 | return [set(region_indices)] 66 | else : 67 | return [set([region_indices[0]]), set([region_indices[1]])] 68 | # case 3 69 | G = nx.Graph() 70 | for idx in region_indices : 71 | G.add_node(idx) 72 | for (u, v) in itertools.combinations(region_indices, 2) : 73 | G.add_edge(u, v, weight = bboxes[u].distance(bboxes[v])) 74 | edges = nx.algorithms.tree.minimum_spanning_edges(G, algorithm = "kruskal", data = True) 75 | edges = sorted(edges, key = lambda a: a[2]['weight'], reverse = True) 76 | edge_weights = [a[2]['weight'] for a in edges] 77 | fontsize = np.mean([bboxes[idx].font_size for idx in region_indices]) 78 | std = np.std(edge_weights) 79 | mean = np.mean(edge_weights) 80 | if (edge_weights[0] <= mean + std * sigma or edge_weights[0] <= fontsize * (1 + gamma)) and std < std_threshold : 81 | return [set(region_indices)] 82 | else : 83 | if edge_weights[0] - edge_weights[1] < std * sigma and std < std_threshold : 84 | return [set(region_indices)] 85 | G = nx.Graph() 86 | for idx in region_indices : 87 | G.add_node(idx) 88 | for edge in edges[1:] : 89 | G.add_edge(edge[0], edge[1]) 90 | ans = [] 91 
| for node_set in nx.algorithms.components.connected_components(G) : 92 | ans.extend(split_text_region(bboxes, node_set, gamma = gamma, sigma = sigma, std_threshold = std_threshold)) 93 | return ans 94 | pass 95 | 96 | def count_valuable_text(text) : 97 | return sum([1 for ch in text if not _is_punctuation(ch) and not _is_control(ch) and not _is_whitespace(ch)]) 98 | 99 | 100 | def get_mini_boxes(contour): 101 | bounding_box = cv2.minAreaRect(contour) 102 | points = sorted(list(cv2.boxPoints(bounding_box)), key=lambda x: x[0]) 103 | 104 | index_1, index_2, index_3, index_4 = 0, 1, 2, 3 105 | if points[1][1] > points[0][1]: 106 | index_1 = 0 107 | index_4 = 1 108 | else: 109 | index_1 = 1 110 | index_4 = 0 111 | if points[3][1] > points[2][1]: 112 | index_2 = 2 113 | index_3 = 3 114 | else: 115 | index_2 = 3 116 | index_3 = 2 117 | 118 | box = [points[index_1], points[index_2], points[index_3], points[index_4]] 119 | box = np.array(box) 120 | startidx = box.sum(axis=1).argmin() 121 | box = np.roll(box, 4-startidx, 0) 122 | box = np.array(box) 123 | return box 124 | 125 | def merge_bboxes_text_region(bboxes: List[Quadrilateral], width, height, gamma = 0.5, sigma = 2, std_threshold = 6.0) : 126 | G = nx.Graph() 127 | for i, box in enumerate(bboxes) : 128 | G.add_node(i, box = box) 129 | bboxes[i].assigned_index = i 130 | # step 1: roughly divide into multiple text region candidates 131 | for ((u, ubox), (v, vbox)) in itertools.combinations(enumerate(bboxes), 2) : 132 | if quadrilateral_can_merge_region_coarse(ubox, vbox) : 133 | G.add_edge(u, v) 134 | 135 | region_indices: List[Set[int]] = [] 136 | for node_set in nx.algorithms.components.connected_components(G) : 137 | # step 2: split each region 138 | region_indices.extend(split_text_region(bboxes, node_set, gamma, sigma, std_threshold)) 139 | 140 | for node_set in region_indices : 141 | nodes = list(node_set) 142 | # get overall bbox 143 | txtlns = np.array(bboxes)[nodes] 144 | kq = np.concatenate([x.pts for x in 
txtlns], axis = 0) 145 | if sum([int(a.is_approximate_axis_aligned) for a in txtlns]) > len(txtlns) // 2 : 146 | max_coord = np.max(kq, axis = 0) 147 | min_coord = np.min(kq, axis = 0) 148 | merged_box = np.maximum(np.array([ 149 | np.array([min_coord[0], min_coord[1]]), 150 | np.array([max_coord[0], min_coord[1]]), 151 | np.array([max_coord[0], max_coord[1]]), 152 | np.array([min_coord[0], max_coord[1]]) 153 | ]), 0) 154 | bbox = np.concatenate([a[None, :] for a in merged_box], axis = 0).astype(int) 155 | else : 156 | # TODO: use better method 157 | bbox = np.concatenate([a[None, :] for a in get_mini_boxes(kq)], axis = 0).astype(int) 158 | # calculate average fg and bg color 159 | fg_r = round(np.mean([box.fg_r for box in [bboxes[i] for i in nodes]])) 160 | fg_g = round(np.mean([box.fg_g for box in [bboxes[i] for i in nodes]])) 161 | fg_b = round(np.mean([box.fg_b for box in [bboxes[i] for i in nodes]])) 162 | bg_r = round(np.mean([box.bg_r for box in [bboxes[i] for i in nodes]])) 163 | bg_g = round(np.mean([box.bg_g for box in [bboxes[i] for i in nodes]])) 164 | bg_b = round(np.mean([box.bg_b for box in [bboxes[i] for i in nodes]])) 165 | # majority vote for direction 166 | dirs = [box.direction for box in [bboxes[i] for i in nodes]] 167 | majority_dir = Counter(dirs).most_common(1)[0][0] 168 | # sort 169 | if majority_dir == 'h' : 170 | nodes = sorted(nodes, key = lambda x: bboxes[x].aabb.y + bboxes[x].aabb.h // 2) 171 | elif majority_dir == 'v' : 172 | nodes = sorted(nodes, key = lambda x: -(bboxes[x].aabb.x + bboxes[x].aabb.w)) 173 | # yield overall bbox and sorted indices 174 | yield bbox, nodes, majority_dir, fg_r, fg_g, fg_b, bg_r, bg_g, bg_b 175 | 176 | from models import V1TextlineMergeRequest 177 | 178 | def run_merge(cfg: V1TextlineMergeRequest, textlines: List[Quadrilateral], width: int, height: int) -> Tuple[List[Quadrilateral], str] : 179 | text_regions: List[Quadrilateral] = [] 180 | new_textlines = [] 181 | for (poly_regions, textline_indices, 
majority_dir, fg_r, fg_g, fg_b, bg_r, bg_g, bg_b) in merge_bboxes_text_region(textlines, width, height, cfg.gamma, cfg.sigma, cfg.std_threshold) : 182 | text = '' 183 | logprob_lengths = [] 184 | for textline_idx in textline_indices : 185 | if not text : 186 | text = textlines[textline_idx].text 187 | else : 188 | last_ch = text[-1] 189 | cur_ch = textlines[textline_idx].text[0] 190 | if ord(last_ch) > 255 and ord(cur_ch) > 255 : 191 | text += textlines[textline_idx].text 192 | else : 193 | if last_ch == '-' and ord(cur_ch) < 255 : 194 | text = text[:-1] + textlines[textline_idx].text 195 | else : 196 | text += ' ' + textlines[textline_idx].text 197 | logprob_lengths.append((np.log(textlines[textline_idx].prob), len(textlines[textline_idx].text))) 198 | vc = count_valuable_text(text) 199 | total_logprobs = 0.0 200 | for (logprob, length) in logprob_lengths : 201 | total_logprobs += logprob * length 202 | total_logprobs /= sum([x[1] for x in logprob_lengths]) 203 | # filter text region without characters 204 | if vc > 1 : 205 | region = Quadrilateral(poly_regions, text, np.exp(total_logprobs), fg_r, fg_g, fg_b, bg_r, bg_g, bg_b) 206 | region.clip(width, height) 207 | region.assigned_direction = majority_dir 208 | text_regions.append(region) 209 | for textline_idx in textline_indices : 210 | region.lines.append(textlines[textline_idx]) 211 | return text_regions, "textline-merge-20220423" 212 | -------------------------------------------------------------------------------- /services/wasm/.gitignore: -------------------------------------------------------------------------------- 1 | /target 2 | **/*.rs.bk 3 | Cargo.lock 4 | bin/ 5 | pkg/ 6 | wasm-pack.log 7 | -------------------------------------------------------------------------------- /services/wasm/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "wasm" 3 | version = "0.1.0" 4 | authors = ["QiroNT"] 5 | edition = "2021" 6 | 7 | [lib] 8 | 
crate-type = ["cdylib", "rlib"] 9 | 10 | [features] 11 | default = ["wee_alloc"] 12 | 13 | [dependencies] 14 | wasm-bindgen = "0.2.63" 15 | 16 | # The `console_error_panic_hook` crate provides better debugging of panics by 17 | # logging them with `console.error`. This is great for development, but requires 18 | # all the `std::fmt` and `std::panicking` infrastructure, so isn't great for 19 | # code size when deploying. 20 | console_error_panic_hook = { version = "0.1.6", optional = true } 21 | 22 | # `wee_alloc` is a tiny allocator for wasm that is only ~1K in code size 23 | # compared to the default allocator's ~10K. It is slower than the default 24 | # allocator, however. 25 | # 26 | # Unfortunately, `wee_alloc` requires nightly Rust when targeting wasm for now. 27 | wee_alloc = { version = "0.4.5", optional = true } 28 | 29 | image = "0.23.14" 30 | img_hash = "3.2.0" 31 | hex = "0.4.3" 32 | 33 | [dev-dependencies] 34 | wasm-bindgen-test = "0.3.13" 35 | 36 | [profile.release] 37 | # Tell `rustc` to optimize for small code size. 38 | opt-level = "s" 39 | -------------------------------------------------------------------------------- /services/wasm/rust-toolchain: -------------------------------------------------------------------------------- 1 | nightly -------------------------------------------------------------------------------- /services/wasm/src/lib.rs: -------------------------------------------------------------------------------- 1 | mod utils; 2 | 3 | use image::{ImageBuffer, RgbaImage}; 4 | use img_hash::{FilterType, HasherConfig}; 5 | use wasm_bindgen::prelude::*; 6 | 7 | // When the `wee_alloc` feature is enabled, use `wee_alloc` as the global 8 | // allocator. 
9 | #[cfg(feature = "wee_alloc")] 10 | #[global_allocator] 11 | static ALLOC: wee_alloc::WeeAlloc = wee_alloc::WeeAlloc::INIT; 12 | 13 | #[wasm_bindgen] 14 | pub fn phash(rgba: Vec<u8>, width: u32, height: u32, hash_size: Option<u32>) -> String { 15 | return phash_inner(rgba, width, height, hash_size.unwrap_or(16)); 16 | } 17 | 18 | fn phash_inner(rgba: Vec<u8>, width: u32, height: u32, hash_size: u32) -> String { 19 | let image: RgbaImage = ImageBuffer::from_raw(width, height, rgba).unwrap(); 20 | 21 | let hasher = HasherConfig::new() 22 | .hash_size(hash_size, hash_size) 23 | .resize_filter(FilterType::Lanczos3) 24 | .to_hasher(); 25 | 26 | let hash = hasher.hash_image(&image); 27 | 28 | return hex::encode(hash.as_bytes()); 29 | } 30 | -------------------------------------------------------------------------------- /services/wasm/src/utils.rs: -------------------------------------------------------------------------------- 1 | pub fn set_panic_hook() { 2 | // When the `console_error_panic_hook` feature is enabled, we can call the 3 | // `set_panic_hook` function at least once during initialization, and then 4 | // we will get better error messages if our code ever panics.
5 | // 6 | // For more details see 7 | // https://github.com/rustwasm/console_error_panic_hook#readme 8 | #[cfg(feature = "console_error_panic_hook")] 9 | console_error_panic_hook::set_once(); 10 | } 11 | -------------------------------------------------------------------------------- /specs/cotrans.yaml: -------------------------------------------------------------------------------- 1 | # TODO: OpenAPI spec here 2 | -------------------------------------------------------------------------------- /types/.gitignore: -------------------------------------------------------------------------------- 1 | /dist/ 2 | -------------------------------------------------------------------------------- /types/LICENSE: -------------------------------------------------------------------------------- 1 | This is free and unencumbered software released into the public domain. 2 | 3 | Anyone is free to copy, modify, publish, use, compile, sell, or 4 | distribute this software, either in source code form or as a compiled 5 | binary, for any purpose, commercial or non-commercial, and by any 6 | means. 7 | 8 | In jurisdictions that recognize copyright laws, the author or authors 9 | of this software dedicate any and all copyright interest in the 10 | software to the public domain. We make this dedication for the benefit 11 | of the public at large and to the detriment of our heirs and 12 | successors. We intend this dedication to be an overt act of 13 | relinquishment in perpetuity of all present and future rights to this 14 | software under copyright law. 15 | 16 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 17 | EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 18 | MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
19 | IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR 20 | OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21 | ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22 | OTHER DEALINGS IN THE SOFTWARE. 23 | 24 | For more information, please refer to -------------------------------------------------------------------------------- /types/package.json: -------------------------------------------------------------------------------- 1 | { 2 | "name": "@cotrans/types", 3 | "type": "module", 4 | "version": "0.0.2", 5 | "private": false, 6 | "license": "Unlicense", 7 | "exports": { 8 | ".": { 9 | "require": "./dist/index.cjs", 10 | "import": "./dist/index.mjs" 11 | } 12 | }, 13 | "main": "./dist/index.cjs", 14 | "types": "./dist/index.d.ts", 15 | "files": [ 16 | "dist" 17 | ], 18 | "scripts": { 19 | "build": "unbuild" 20 | }, 21 | "devDependencies": { 22 | "unbuild": "^1.2.1" 23 | } 24 | } 25 | -------------------------------------------------------------------------------- /types/src/index.ts: -------------------------------------------------------------------------------- 1 | /* eslint-disable @typescript-eslint/ban-types */ 2 | 3 | export interface TaskResult { 4 | /** 5 | * The URL to a mask layer to be applied on top of the original image. 6 | * 7 | * When the mask is empty, this value will be a URI of exactly:
8 | * `data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAQAAAC1HAwCAAAAC0lEQVQI12NgYAAAAAMAASDVlMcAAAAASUVORK5CYII=`
9 | * Which is a transparent 1x1 PNG image.
10 | * This image is only meant for backwards compatibility, and the client should skip masking in this case. 11 | * 12 | * @example 13 | * 'https://r2.cotrans.touhou.ai/mask/h4zjxwhjshl68pgfkwcad0w9.png' 14 | */ 15 | translation_mask: string 16 | } 17 | 18 | export interface QueryV1MessagePending { 19 | /** 20 | * Indicates that the task is still in the queue. 21 | */ 22 | type: 'pending' 23 | /** 24 | * The image's position in the queue, starts at 1. 25 | */ 26 | pos: number 27 | } 28 | 29 | export interface QueryV1MessageStatus { 30 | /** 31 | * Streamed status updates for the task. 32 | */ 33 | type: 'status' 34 | /** 35 | * The current status of the task.
36 | * Current possible values are listed in the type, but more may be added in the future. 37 | * 38 | * Values beginning with `error-` should be considered as errors. 39 | * Upon receiving such message, the client will be disconnected shortly after, 40 | * without receiving an `error` message. 41 | */ 42 | status: string & {} 43 | // cat manga_translator.py | sed -n -E "/server_send_status\(websocket, task\.id, |\.status\.status = |_report_progress\('/s/^.*'([^']+)'.*$/| '\1'/p" | sort | uniq 44 | | 'colorizing' 45 | | 'detection' 46 | | 'downloading' 47 | | 'downscaling' 48 | | 'error' 49 | | 'error-download' 50 | | 'error-lang' 51 | | 'error-translating' 52 | | 'error-upload' 53 | | 'finished' 54 | | 'inpainting' 55 | | 'mask-generation' 56 | | 'ocr' 57 | | 'pending' 58 | | 'preparing' 59 | | 'rendering' 60 | | 'saved' 61 | | 'saving' 62 | | 'skip-no-regions' 63 | | 'skip-no-text' 64 | | 'textline_merge' 65 | | 'translating' 66 | | 'uploading' 67 | | 'upscaling' 68 | } 69 | 70 | export interface QueryV1MessageResult { 71 | /** 72 | * Indicates that the task has finished and the result is available. 73 | */ 74 | type: 'result' 75 | /** 76 | * The result of the task. 77 | */ 78 | result: TaskResult 79 | } 80 | 81 | export interface QueryV1MessageError { 82 | /** 83 | * Indicates that the task has encountered an error. 84 | */ 85 | type: 'error' 86 | /** 87 | * A unique identifier given each occurrence of an error. 88 | * 89 | * @example 'tz4a98xxat96iws9zmbrgj3a' 90 | */ 91 | error_id?: string | null 92 | /** 93 | * An identifier for the error type.
94 | * Current possible values are listed in the type, but more may be added in the future. 95 | */ 96 | error?: string & {} | null 97 | | 'error-db' 98 | | 'error-worker' 99 | } 100 | 101 | export interface QueryV1MessageNotFound { 102 | /** 103 | * The given task id was not found in neither the queue nor the database. 104 | */ 105 | type: 'not_found' 106 | } 107 | 108 | /** 109 | * A message returned by the `/task/:id/status/v1` or `/task/:id/event/v1` endpoint. 110 | */ 111 | export type QueryV1Message = 112 | | QueryV1MessagePending 113 | | QueryV1MessageStatus 114 | | QueryV1MessageResult 115 | | QueryV1MessageError 116 | | QueryV1MessageNotFound 117 | 118 | /** 119 | * A message returned by the `/group/:group/event/v1` endpoint. 120 | */ 121 | export type GroupQueryV1Message = QueryV1Message & { 122 | /** 123 | * The id of the task. 124 | */ 125 | id: string 126 | } 127 | 128 | /** 129 | * Indicates the task has been successfully processed or was added to the queue. 130 | */ 131 | export interface UploadV1ResultSuccess { 132 | /** 133 | * The id of the task. 134 | */ 135 | id: string 136 | /** 137 | * The image's position in the queue, starts at 1. 138 | */ 139 | pos?: number | null 140 | /** 141 | * The result of the task, if it was already processed. 142 | */ 143 | result?: TaskResult | null 144 | } 145 | 146 | /** 147 | * Indicates the task could not be processed. 148 | */ 149 | export interface UploadV1ResultError { 150 | id: null 151 | /** 152 | * An identifier for the error type.
153 | * Current possible values are listed in the type, but more may be added in the future. 154 | * 155 | * `group-limit`: The task has been bound to too many groups.<br>
156 | * `queue-full`: The queue is full.
157 | * `fetch-failed`: The URL could not be fetched. (only for `url` uploads)<br>
158 | * `file-too-large`: The file is too large. Currently the limit is 20MiB.
159 | * `resize-crash`: The resize process crashed, usually due to insufficient memory. 160 | * This can happen if the image has very large dimensions, or if the image is corrupted, 161 | * or if the image uses a color type outside of `RGB`, `RGBA`, `L`, `LA`. 162 | * The general guideline is to keep the image dimensions below 4096x4096.
163 | */ 164 | error?: string & {} | null 165 | | 'group-limit' 166 | | 'queue-full' 167 | | 'fetch-failed' 168 | | 'file-too-large' 169 | | 'resize-crash' 170 | } 171 | 172 | /** 173 | * The result of the `/task/upload/v1` endpoint. 174 | */ 175 | export type UploadV1Result = UploadV1ResultSuccess | UploadV1ResultError 176 | -------------------------------------------------------------------------------- /types/tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "compilerOptions": { 3 | "baseUrl": ".", 4 | "module": "ESNext", 5 | "target": "ESNext", 6 | "lib": ["ESNext"], 7 | "strict": true, 8 | "esModuleInterop": true, 9 | "skipLibCheck": true, 10 | "moduleResolution": "node", 11 | "jsx": "preserve", 12 | "resolveJsonModule": true, 13 | "strictNullChecks": true, 14 | "forceConsistentCasingInFileNames": true, 15 | "paths": { 16 | "@/*": ["*"] 17 | } 18 | }, 19 | "include": ["**/*.ts"], 20 | "exclude": ["dist", "node_modules"] 21 | } 22 | -------------------------------------------------------------------------------- /uno.config.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VoileLabs/cotrans/08992fa0d89e40f22477e90a361823942f2f8c86/uno.config.ts -------------------------------------------------------------------------------- /userscript/.gitignore: -------------------------------------------------------------------------------- 1 | /dist/ 2 | -------------------------------------------------------------------------------- /userscript/.vscode/i18n-ally-custom-framework.yml: -------------------------------------------------------------------------------- 1 | languageIds: 2 | - javascript 3 | - typescript 4 | - javascriptreact 5 | - typescriptreact 6 | 7 | usageMatchRegex: 8 | - '[^\w\d]t\([''"`]({key})[''"`]' 9 | 10 | refactorTemplates: 11 | - t('$1') 12 | 13 | monopoly: true 14 | 
-------------------------------------------------------------------------------- /userscript/.vscode/settings.json: -------------------------------------------------------------------------------- 1 | { 2 | "i18n-ally.localesPaths": [ 3 | "src/i18n" 4 | ], 5 | "i18n-ally.sourceLanguage": "zh-CN", 6 | "i18n-ally.keystyle": "nested" 7 | } 8 | -------------------------------------------------------------------------------- /userscript/package.json: -------------------------------------------------------------------------------- 1 | { 2 | "name": "imgtrans-userscript", 3 | "type": "module", 4 | "version": "0.8.0-bata.17", 5 | "private": true, 6 | "scripts": { 7 | "build": "rollup -c", 8 | "buildw": "rollup -cw", 9 | "test": "vitest --run", 10 | "testw": "vitest --watch", 11 | "lint": "eslint --fix ." 12 | }, 13 | "dependencies": { 14 | "@solid-primitives/event-listener": "^2.2.13", 15 | "@solid-primitives/map": "^0.4.6", 16 | "@solid-primitives/mutation-observer": "^1.1.13", 17 | "@solid-primitives/scheduled": "^1.4.0", 18 | "@solid-primitives/utils": "^6.2.0", 19 | "@twind/core": "^1.1.3", 20 | "@twind/preset-autoprefix": "^1.0.7", 21 | "@twind/preset-tailwind": "^1.1.4", 22 | "solid-js": "^1.7.8" 23 | }, 24 | "devDependencies": { 25 | "@babel/core": "^7.22.9", 26 | "@iconify-json/carbon": "^1.1.18", 27 | "@iconify-json/fluent": "^1.1.27", 28 | "@rollup/plugin-babel": "^6.0.3", 29 | "@rollup/plugin-commonjs": "^25.0.3", 30 | "@rollup/plugin-node-resolve": "^15.1.0", 31 | "@rollup/plugin-yaml": "^4.1.1", 32 | "@types/node": "^20.4.4", 33 | "@types/tampermonkey": "^4.0.10", 34 | "babel-preset-solid": "^1.7.7", 35 | "esbuild": "^0.18.15", 36 | "fast-glob": "^3.3.1", 37 | "happy-dom": "^10.5.2", 38 | "magic-string": "^0.30.1", 39 | "resolve": "^1.22.2", 40 | "rimraf": "^5.0.1", 41 | "rollup": "^3.26.3", 42 | "rollup-plugin-esbuild": "^5.0.0", 43 | "unplugin-icons": "^0.16.5", 44 | "vitest": "^0.33.0" 45 | } 46 | } 47 | 
-------------------------------------------------------------------------------- /userscript/rollup.config.js: -------------------------------------------------------------------------------- 1 | import path from 'node:path' 2 | import fs from 'node:fs' 3 | import resolve from 'resolve' 4 | import glob from 'fast-glob' 5 | import { defineConfig } from 'rollup' 6 | import { nodeResolve } from '@rollup/plugin-node-resolve' 7 | import commonjs from '@rollup/plugin-commonjs' 8 | import esbuild from 'rollup-plugin-esbuild' 9 | import icons from 'unplugin-icons/rollup' 10 | import yaml from '@rollup/plugin-yaml' 11 | import { babel } from '@rollup/plugin-babel' 12 | import info from './package.json' assert { type: 'json' } 13 | 14 | function fileExists(filePath) { 15 | try { 16 | return fs.statSync(filePath).isFile() 17 | } 18 | catch { 19 | return false 20 | } 21 | } 22 | 23 | function scanLicenses() { 24 | const pending = new Set(Object.keys(info.dependencies)) 25 | const res = [] 26 | for (const lib of pending) { 27 | const pkgJsonPath = resolve.sync(`${lib}/package.json`) 28 | const pkgPath = path.dirname(pkgJsonPath) 29 | const pkgJson = JSON.parse(fs.readFileSync(pkgJsonPath, 'utf-8')) 30 | 31 | if ('dependencies' in pkgJson) { 32 | for (const dep of Object.keys(pkgJson.dependencies)) 33 | pending.add(dep) 34 | } 35 | 36 | if (fileExists(path.join(pkgPath, 'LICENSE'))) 37 | res.push(path.join(pkgPath, 'LICENSE')) 38 | } 39 | return res 40 | } 41 | 42 | function gennerateConfig(input, output, banner) { 43 | return defineConfig({ 44 | input, 45 | output: { 46 | dir: 'dist', 47 | entryFileNames: output, 48 | format: 'iife', 49 | generatedCode: 'es2015', 50 | banner: fs 51 | .readFileSync(banner, 'utf8') 52 | .replace(/{{version}}/g, info.version), 53 | footer: `\n${glob.sync([ 54 | '../LICENSE', 55 | 'src/**/LICENSE*', 56 | ...scanLicenses(), 57 | ], { onlyFiles: true }) 58 | .map(file => `/*\n${fs.readFileSync(file, 'utf-8').trimEnd()}\n*/`) 59 | .filter((v, i, a) => 
a.indexOf(v) === i) 60 | .join('\n\n')}`, 61 | }, 62 | plugins: [ 63 | nodeResolve(), 64 | commonjs(), 65 | yaml(), 66 | icons({ 67 | compiler: 'solid', 68 | }), 69 | esbuild({ 70 | charset: 'utf8', 71 | target: 'es2020', 72 | }), 73 | babel({ 74 | extensions: ['.js', '.jsx', '.ts', '.tsx'], 75 | babelHelpers: 'bundled', 76 | presets: [ 77 | ['babel-preset-solid', { 78 | delegateEvents: false, 79 | }], 80 | ], 81 | }), 82 | ], 83 | }) 84 | } 85 | 86 | export default [ 87 | gennerateConfig('src/main-regular.ts', 'imgtrans-userscript.user.js', 'src/banner-regular.js'), 88 | gennerateConfig('src/main-nsfw.ts', 'imgtrans-userscript-nsfw.user.js', 'src/banner-nsfw.js'), 89 | ] 90 | -------------------------------------------------------------------------------- /userscript/src/banner-nsfw.js: -------------------------------------------------------------------------------- 1 | // ==UserScript== 2 | // @name Cotrans Manga/Image Translator (NSFW Edition) 3 | // @name:zh-CN Cotrans 漫画/图片翻译器 (NSFW 版) 4 | // @namespace https://cotrans.touhou.ai/userscript/#nsfw 5 | // @version {{version}} 6 | // @description (WIP) Translate texts in images on E-Hentai(ExHentai) 7 | // @description:zh-CN (WIP) 一键翻译图片内文字,支持 E-Hentai(ExHentai) 8 | // @author QiroNT 9 | // @license GPL-3.0 10 | // @contributionURL https://ko-fi.com/voilelabs 11 | // @supportURL https://discord.gg/975FRV8ca6 12 | // @source https://cotrans.touhou.ai/ 13 | // @include https://e-hentai.org/* 14 | // @match http://e-hentai.org/* 15 | // @include https://exhentai.org/* 16 | // @match http://exhentai.org/* 17 | // @connect e-hentai.org 18 | // @connect exhentai.org 19 | // @connect exhentai55ld2wyap5juskbm67czulomrouspdacjamjeloj7ugjbsad.onion 20 | // @connect hath.network 21 | // @connect api.cotrans.touhou.ai 22 | // @connect r2.cotrans.touhou.ai 23 | // @connect cotrans-r2.moe.ci 24 | // @connect * 25 | // @grant GM.xmlHttpRequest 26 | // @grant GM_xmlhttpRequest 27 | // @grant GM.setValue 28 | // @grant GM_setValue 
29 | // @grant GM.getValue 30 | // @grant GM_getValue 31 | // @grant GM.deleteValue 32 | // @grant GM_deleteValue 33 | // @grant GM.addValueChangeListener 34 | // @grant GM_addValueChangeListener 35 | // @grant GM.removeValueChangeListener 36 | // @grant GM_removeValueChangeListener 37 | // @grant window.onurlchange 38 | // @run-at document-idle 39 | // ==/UserScript== 40 | 41 | /* eslint-disable no-undef, unused-imports/no-unused-vars */ 42 | const VERSION = '{{version}}' 43 | const EDITION = 'nsfw' 44 | let GMP 45 | { 46 | // polyfill functions 47 | const GMPFunctionMap = { 48 | xmlHttpRequest: typeof GM_xmlhttpRequest !== 'undefined' ? GM_xmlhttpRequest : undefined, 49 | setValue: typeof GM_setValue !== 'undefined' ? GM_setValue : undefined, 50 | getValue: typeof GM_getValue !== 'undefined' ? GM_getValue : undefined, 51 | deleteValue: typeof GM_deleteValue !== 'undefined' ? GM_deleteValue : undefined, 52 | addValueChangeListener: typeof GM_addValueChangeListener !== 'undefined' ? GM_addValueChangeListener : undefined, 53 | removeValueChangeListener: typeof GM_removeValueChangeListener !== 'undefined' ? GM_removeValueChangeListener : undefined, 54 | } 55 | const xmlHttpRequest = GM.xmlHttpRequest.bind(GM) || GMPFunctionMap.xmlHttpRequest 56 | GMP = new Proxy(GM, { 57 | get(target, prop) { 58 | if (prop === 'xmlHttpRequest') { 59 | return (context) => { 60 | return new Promise((resolve, reject) => { 61 | xmlHttpRequest({ 62 | ...context, 63 | onload(event) { 64 | context.onload?.() 65 | resolve(event) 66 | }, 67 | onerror(event) { 68 | context.onerror?.() 69 | reject(event) 70 | }, 71 | }) 72 | }) 73 | } 74 | } 75 | if (prop in target) { 76 | const v = target[prop] 77 | return typeof v === 'function' ? 
v.bind(target) : v 78 | } 79 | if (prop in GMPFunctionMap && typeof GMPFunctionMap[prop] === 'function') 80 | return GMPFunctionMap[prop] 81 | 82 | console.error(`[Cotrans Manga Translator] GM.${prop} isn't supported in your userscript engine and it's required by this script. This may lead to unexpected behavior.`) 83 | }, 84 | }) 85 | } 86 | -------------------------------------------------------------------------------- /userscript/src/banner-regular.js: -------------------------------------------------------------------------------- 1 | // ==UserScript== 2 | // @name Cotrans Manga/Image Translator (Regular Edition) 3 | // @name:zh-CN Cotrans 漫画/图片翻译器 (常规版) 4 | // @namespace https://cotrans.touhou.ai/userscript/#regular 5 | // @version {{version}} 6 | // @description (WIP) Translate texts in images on Pixiv, Twitter, Misskey, Calckey 7 | // @description:zh-CN (WIP) 一键翻译图片内文字,支持 Pixiv, Twitter, Misskey, Calckey 8 | // @author QiroNT 9 | // @license GPL-3.0 10 | // @contributionURL https://ko-fi.com/voilelabs 11 | // @supportURL https://discord.gg/975FRV8ca6 12 | // @source https://cotrans.touhou.ai/ 13 | // @include https://www.pixiv.net/* 14 | // @match https://www.pixiv.net/* 15 | // @include https://twitter.com/* 16 | // @match https://twitter.com/* 17 | // @include https://misskey.io/* 18 | // @match https://misskey.io/* 19 | // @include https://calckey.social/* 20 | // @match https://calckey.social/* 21 | // @include https://* 22 | // @match https://* 23 | // @connect pixiv.net 24 | // @connect pximg.net 25 | // @connect twitter.com 26 | // @connect twimg.com 27 | // @connect misskey.io 28 | // @connect misskeyusercontent.com 29 | // @connect s3.arkjp.net 30 | // @connect nfs.pub 31 | // @connect calckey.social 32 | // @connect backblazeb2.com 33 | // @connect dvd.moe 34 | // @connect api.cotrans.touhou.ai 35 | // @connect r2.cotrans.touhou.ai 36 | // @connect cotrans-r2.moe.ci 37 | // @connect * 38 | // @grant GM.xmlHttpRequest 39 | // @grant 
GM_xmlhttpRequest 40 | // @grant GM.setValue 41 | // @grant GM_setValue 42 | // @grant GM.getValue 43 | // @grant GM_getValue 44 | // @grant GM.deleteValue 45 | // @grant GM_deleteValue 46 | // @grant GM.addValueChangeListener 47 | // @grant GM_addValueChangeListener 48 | // @grant GM.removeValueChangeListener 49 | // @grant GM_removeValueChangeListener 50 | // @grant window.onurlchange 51 | // @run-at document-idle 52 | // ==/UserScript== 53 | 54 | /* eslint-disable no-undef, unused-imports/no-unused-vars */ 55 | const VERSION = '{{version}}' 56 | const EDITION = 'regular' 57 | let GMP 58 | { 59 | // polyfill functions 60 | const GMPFunctionMap = { 61 | xmlHttpRequest: typeof GM_xmlhttpRequest !== 'undefined' ? GM_xmlhttpRequest : undefined, 62 | setValue: typeof GM_setValue !== 'undefined' ? GM_setValue : undefined, 63 | getValue: typeof GM_getValue !== 'undefined' ? GM_getValue : undefined, 64 | deleteValue: typeof GM_deleteValue !== 'undefined' ? GM_deleteValue : undefined, 65 | addValueChangeListener: typeof GM_addValueChangeListener !== 'undefined' ? GM_addValueChangeListener : undefined, 66 | removeValueChangeListener: typeof GM_removeValueChangeListener !== 'undefined' ? GM_removeValueChangeListener : undefined, 67 | } 68 | const xmlHttpRequest = GM.xmlHttpRequest.bind(GM) || GMPFunctionMap.xmlHttpRequest 69 | GMP = new Proxy(GM, { 70 | get(target, prop) { 71 | if (prop === 'xmlHttpRequest') { 72 | return (context) => { 73 | return new Promise((resolve, reject) => { 74 | xmlHttpRequest({ 75 | ...context, 76 | onload(event) { 77 | context.onload?.() 78 | resolve(event) 79 | }, 80 | onerror(event) { 81 | context.onerror?.() 82 | reject(event) 83 | }, 84 | }) 85 | }) 86 | } 87 | } 88 | if (prop in target) { 89 | const v = target[prop] 90 | return typeof v === 'function' ? 
v.bind(target) : v 91 | } 92 | if (prop in GMPFunctionMap && typeof GMPFunctionMap[prop] === 'function') 93 | return GMPFunctionMap[prop] 94 | 95 | console.error(`[Cotrans Manga Translator] GM.${prop} isn't supported in your userscript engine and it's required by this script. This may lead to unexpected behavior.`) 96 | }, 97 | }) 98 | } 99 | -------------------------------------------------------------------------------- /userscript/src/eHentai/gallery.ts: -------------------------------------------------------------------------------- 1 | import type { Translator, TranslatorInstance } from '../main' 2 | 3 | function mount(): TranslatorInstance { 4 | const galleryId = window.location.pathname.match(/\/g\/(\d+)/)?.[1] 5 | if (!galleryId) 6 | return {} 7 | 8 | return {} 9 | } 10 | 11 | const translator: Translator = { 12 | match(url) { 13 | // https://e-hentai.org/g// 14 | // https://exhentai.org/g// 15 | // https://exhentai55ld2wyap5juskbm67czulomrouspdacjamjeloj7ugjbsad.onion/g// 16 | if (!url.hostname.endsWith('e-hentai.org') && !url.hostname.endsWith('exhentai.org') 17 | && !url.hostname.endsWith('exhentai55ld2wyap5juskbm67czulomrouspdacjamjeloj7ugjbsad.onion')) 18 | return false 19 | if (!url.pathname.startsWith('/g/')) 20 | return false 21 | return true 22 | }, 23 | mount, 24 | } 25 | 26 | export default translator 27 | -------------------------------------------------------------------------------- /userscript/src/eHentai/page.ts: -------------------------------------------------------------------------------- 1 | import type { Translator, TranslatorInstance } from '../main' 2 | 3 | function mount(): TranslatorInstance { 4 | return {} 5 | } 6 | 7 | const translator: Translator = { 8 | match(url) { 9 | // https://e-hentai.org/s//- 10 | // https://exhentai.org/s//- 11 | // https://exhentai55ld2wyap5juskbm67czulomrouspdacjamjeloj7ugjbsad.onion/s//- 12 | return false 13 | }, 14 | mount, 15 | } 16 | 17 | export default translator 18 | 
-------------------------------------------------------------------------------- /userscript/src/eHentai/settings.ts: -------------------------------------------------------------------------------- 1 | import type { SettingsInjector, SettingsInjectorInstance } from '../main' 2 | 3 | function mount(): SettingsInjectorInstance { 4 | return {} 5 | } 6 | 7 | const settingsInjector: SettingsInjector = { 8 | match(url) { 9 | return false 10 | }, 11 | mount, 12 | } 13 | 14 | export default settingsInjector 15 | -------------------------------------------------------------------------------- /userscript/src/i18n/en-US.yml: -------------------------------------------------------------------------------- 1 | common: 2 | source: 3 | download-image: Downloading original image 4 | download-image-progress: Downloading original image ({progress}) 5 | download-image-error: Error during original image download 6 | client: 7 | submit: Submitting translation 8 | submit-progress: Submitting translation ({progress}) 9 | submit-final: Waiting for image transpile 10 | submit-error: Error during translation submission 11 | download-image: Downloading translated image 12 | download-image-progress: Downloading translated image ({progress}) 13 | download-image-error: Error during translated image download 14 | resize: Resizing image 15 | merging: Merging layers 16 | status: 17 | default: Unknown status 18 | pending: Pending 19 | pending-pos: Pending, {pos} in queue 20 | downloading: Transferring image 21 | preparing: Waiting for idle window 22 | colorizing: Colorizing 23 | upscaling: Upscaling 24 | downscaling: Downscaling 25 | detection: Detecting text 26 | ocr: Scanning text 27 | textline_merge: Merging text lines 28 | mask-generation: Generating mask 29 | inpainting: Inpainting 30 | translating: Translating 31 | rendering: Rendering 32 | finished: Finishing 33 | saved: Saved 34 | saving: Saving result 35 | uploading: Transferring result 36 | error: Error during translation 37 | 
error-download: Image transfer failed 38 | error-upload: Result transfer failed 39 | error-lang: The target language is not supported by the chosen translator 40 | error-translating: Did not get any text back from the text translation service 41 | skip-no-regions: No text regions detected in the image 42 | skip-no-text: No text detected in the image 43 | error-with-id: 'Error during translation (ID: {id})' 44 | control: 45 | translate: Translate 46 | batch: Translate all ({count}) 47 | reset: Reset 48 | batch: 49 | progress: Translating ({count}/{total} finished) 50 | finish: Translation finished 51 | error: Translation finished with errors 52 | settings: 53 | detection-resolution: Text detection resolution 54 | render-text-orientation: Render text orientation 55 | render-text-orientation-options: 56 | auto: Follow source 57 | horizontal: Horizontal only 58 | vertical: Vertical only 59 | reset: Reset Settings 60 | target-language: Translate target language 61 | target-language-options: 62 | auto: Follow website 63 | text-detector: Text detector 64 | text-detector-options: 65 | default: Default 66 | title: Cotrans Manga Translator Settings 67 | translator: Translator 68 | script-language: Userscript language 69 | script-language-options: 70 | auto: Follow website language 71 | inline-options-title: Current Settings 72 | detection-resolution-desc: >- 73 | The resolution used to scan texts on an image, higher value are better 74 | suited for smaller texts. 75 | script-language-desc: Language of this userscript. 76 | render-text-orientation-desc: Overwrite the orientation of texts rendered in the translated image. 77 | target-language-desc: The language that images are translated to. 78 | text-detector-desc: The detector used to scan texts in an image. 79 | translator-desc: The translate service used to translate texts. 
80 | translator-options: 81 | none: None (remove texts) 82 | keep-instances-options: 83 | until-reload: Until page reload 84 | until-navigate: Until next navigation 85 | keep-instances: Keep translation instances 86 | keep-instances-desc: >- 87 | How long before a translation instance is disposed. A translation instance 88 | includes the translation state of an image, that is, whether the image is 89 | translated or not, and the translation result. Keeping more translation 90 | instances will result in more memory consumption. 91 | force-retry: Force retry (ignore cache) 92 | sponsor: 93 | text: If you find this script helpful, please consider supporting us! 94 | -------------------------------------------------------------------------------- /userscript/src/i18n/index.ts: -------------------------------------------------------------------------------- 1 | import type { MaybeAccessor } from '@solid-primitives/utils' 2 | import { access } from '@solid-primitives/utils' 3 | import type { Accessor } from 'solid-js' 4 | import { createMemo, createSignal } from 'solid-js' 5 | import { scriptLang } from '../utils/storage' 6 | 7 | import zhCN from './zh-CN.yml' 8 | import enUS from './en-US.yml' 9 | 10 | const messages: Record = { 11 | 'zh-CN': zhCN, 12 | 'en-US': enUS, 13 | } 14 | 15 | function tryMatchLang(lang: string): string { 16 | if (lang.startsWith('zh')) 17 | return 'zh-CN' 18 | if (lang.startsWith('en')) 19 | return 'en-US' 20 | return 'en-US' 21 | } 22 | 23 | export const [realLang, setRealLang] = createSignal(navigator.language) 24 | export const lang = createMemo(() => scriptLang() || tryMatchLang(realLang())) 25 | 26 | export function t(key_: MaybeAccessor, props: MaybeAccessor>> = {}): Accessor { 27 | return createMemo(() => { 28 | const key = access(key_) 29 | const segments = key.split('.') 30 | const msg: string = segments.reduce((obj, k) => obj[k], messages[lang()]) ?? 
segments.reduce((obj, k) => obj?.[k], messages['zh-CN']) /* obj?.[k]: a missing intermediate key now yields undefined instead of throwing, so the key itself is returned below */ 31 | if (!msg) 32 | return key 33 | return msg.replace(/\{([^}]+)\}/g, (_, k) => String(access(access(props)[k]) ?? '')) /* `?? ''` must apply before String(): String(undefined) is the literal text "undefined", so missing params previously rendered as "undefined" */ 34 | }) 35 | } 36 | 37 | let langEL: HTMLHtmlElement | undefined 38 | let langObserver: MutationObserver | undefined 39 | 40 | export function changeLangEl(el: HTMLHtmlElement) { 41 | if (langEL === el) 42 | return 43 | 44 | if (langObserver) 45 | langObserver.disconnect() 46 | 47 | langObserver = new MutationObserver((mutations) => { 48 | for (const mutation of mutations) { 49 | if (mutation.type === 'attributes' && mutation.attributeName === 'lang') { 50 | const target = mutation.target as HTMLHtmlElement 51 | if (target.lang) 52 | setRealLang(target.lang) 53 | break 54 | } 55 | } 56 | }) 57 | langObserver.observe(el, { attributes: true }) 58 | 59 | langEL = el 60 | setRealLang(el.lang) 61 | } 62 | 63 | export function BCP47ToISO639(code: string): string { 64 | try { 65 | const lo = new Intl.Locale(code) 66 | switch (lo.language) { 67 | case 'zh': { 68 | switch (lo.script) { 69 | case 'Hans': 70 | return 'CHS' 71 | case 'Hant': 72 | return 'CHT' 73 | } 74 | switch (lo.region) { 75 | case 'CN': 76 | return 'CHS' 77 | case 'HK': 78 | case 'TW': 79 | return 'CHT' 80 | } 81 | return 'CHS' 82 | } 83 | case 'ja': 84 | return 'JPN' 85 | case 'en': 86 | return 'ENG' 87 | case 'ko': 88 | return 'KOR' 89 | case 'vi': 90 | return 'VIE' 91 | case 'cs': 92 | return 'CSY' 93 | case 'nl': 94 | return 'NLD' 95 | case 'fr': 96 | return 'FRA' 97 | case 'de': 98 | return 'DEU' 99 | case 'hu': 100 | return 'HUN' 101 | case 'it': 102 | return 'ITA' 103 | case 'pl': 104 | return 'PLK' 105 | case 'pt': 106 | return 'PTB' 107 | case 'ro': 108 | return 'ROM' 109 | case 'ru': 110 | return 'RUS' 111 | case 'es': 112 | return 'ESP' 113 | case 'tr': 114 | return 'TRK' 115 | case 'uk': 116 | return 'UKR' 117 | } 118 | return 'ENG' 119 | } 120 | catch (e) { 121 | return 'ENG' 122 | } 123 | } 124 |
-------------------------------------------------------------------------------- /userscript/src/i18n/zh-CN.yml: -------------------------------------------------------------------------------- 1 | common: 2 | source: 3 | download-image: 正在拉取原图 4 | download-image-progress: 正在拉取原图({progress}) 5 | download-image-error: 拉取原图出错 6 | client: 7 | submit: 正在提交翻译 8 | submit-progress: 正在提交翻译({progress}) 9 | submit-final: 等待图片转存 10 | submit-error: 提交翻译出错 11 | download-image: 正在下载图片 12 | download-image-progress: 正在下载图片({progress}) 13 | download-image-error: 下载图片出错 14 | resize: 正在缩放图片 15 | merging: 正在合并图层 16 | status: 17 | default: 未知状态 18 | pending: 正在等待 19 | pending-pos: 正在等待,列队还有 {pos} 张图片 20 | downloading: 正在传输图片 21 | preparing: 等待空闲窗口 22 | colorizing: 正在上色 23 | upscaling: 正在放大图片 24 | downscaling: 正在缩小图片 25 | detection: 正在检测文本 26 | ocr: 正在识别文本 27 | textline_merge: 正在整合文本 28 | mask-generation: 正在生成文本掩码 29 | inpainting: 正在修补图片 30 | translating: 正在翻译文本 31 | rendering: 正在渲染文本 32 | finished: 正在整理结果 33 | saved: 保存结果 34 | saving: 正在保存结果 35 | uploading: 正在传输结果 36 | error: 翻译出错 37 | error-download: 传输图片失败 38 | error-upload: 传输结果失败 39 | error-lang: 你选择的翻译服务不支持你选择的语言 40 | error-translating: 翻译服务没有返回任何文本 41 | skip-no-regions: 图片中没有检测到文本区域 42 | skip-no-text: 图片中没有检测到文本 43 | error-with-id: '翻译出错 (ID: {id})' 44 | control: 45 | translate: 翻译 46 | batch: 翻译全部 ({count}) 47 | reset: 还原 48 | batch: 49 | progress: 翻译中 ({count}/{total}) 50 | finish: 翻译完成 51 | error: 翻译完成(有失败) 52 | settings: 53 | title: Cotrans 图片翻译器设置 54 | inline-options-title: 设置当前翻译 55 | detection-resolution: 文本扫描清晰度 56 | text-detector: 文本扫描器 57 | text-detector-options: 58 | default: 默认 59 | translator: 翻译服务 60 | render-text-orientation: 渲染字体方向 61 | render-text-orientation-options: 62 | auto: 跟随原文本 63 | horizontal: 仅限水平 64 | vertical: 仅限垂直 65 | target-language: 翻译语言 66 | target-language-options: 67 | auto: 跟随网页语言 68 | script-language: 用户脚本语言 69 | script-language-options: 70 | auto: 跟随网页语言 71 | reset: 重置所有设置 72 | 
detection-resolution-desc: 设置检测图片文本所用的清晰度,小文字适合使用更高的清晰度。 73 | text-detector-desc: 设置使用的文本扫描器。 74 | translator-desc: 设置翻译图片所用的翻译服务。 75 | render-text-orientation-desc: 设置嵌字的文本方向。 76 | target-language-desc: 设置图片翻译后的语言。 77 | script-language-desc: 设置此用户脚本的语言。 78 | translator-options: 79 | none: None (删除文字) 80 | keep-instances-options: 81 | until-reload: 直到页面刷新 82 | until-navigate: 直到下次跳转 83 | keep-instances: 保留翻译进度 84 | keep-instances-desc: >- 85 | 设置翻译进度的保留时间。 翻译进度即图片的翻译状态和翻译结果。 86 | 保留更多的翻译进度会占用更多的内存。 87 | force-retry: 强制重试 (忽略缓存) 88 | sponsor: 89 | text: 制作不易,请考虑赞助我们! 90 | -------------------------------------------------------------------------------- /userscript/src/main-nsfw.ts: -------------------------------------------------------------------------------- 1 | import eHentaiGallery from './eHentai/gallery' 2 | import eHentaiPage from './eHentai/page' 3 | import eHentaiSettings from './eHentai/settings' 4 | import { start } from './main' 5 | 6 | start( 7 | [ 8 | eHentaiGallery, 9 | eHentaiPage, 10 | ], 11 | [ 12 | eHentaiSettings, 13 | ], 14 | ) 15 | -------------------------------------------------------------------------------- /userscript/src/main-regular.ts: -------------------------------------------------------------------------------- 1 | import { start } from './main' 2 | import pixiv from './pixiv' 3 | import pixivSettings from './pixiv/settings' 4 | import twitter from './twitter' 5 | import twitterSettings from './twitter/settings' 6 | import misskey from './misskey' 7 | 8 | start( 9 | [ 10 | pixiv, 11 | twitter, 12 | misskey, 13 | ], 14 | [ 15 | pixivSettings, 16 | twitterSettings, 17 | ], 18 | ) 19 | -------------------------------------------------------------------------------- /userscript/src/main.ts: -------------------------------------------------------------------------------- 1 | import { throttle } from '@solid-primitives/scheduled' 2 | import { createRoot } from 'solid-js' 3 | import { DelegatedEvents } from 'solid-js/web' 4 | import { 
changeLangEl } from './i18n' 5 | import { storageReady } from './utils/storage' 6 | 7 | // https://github.com/solidjs/solid/issues/334#issuecomment-773807937 8 | DelegatedEvents.clear() 9 | 10 | export interface TranslatorInstance { 11 | canKeep?: (url: string) => unknown 12 | onURLChange?: (url: string) => unknown 13 | } 14 | export interface Translator { 15 | match: (url: URL) => unknown 16 | mount: () => TranslatorInstance 17 | } 18 | 19 | export interface SettingsInjectorInstance { 20 | canKeep?: (url: string) => unknown 21 | onURLChange?: (url: string) => unknown 22 | } 23 | export interface SettingsInjector { 24 | match: (url: URL) => unknown 25 | mount: () => SettingsInjectorInstance 26 | } 27 | 28 | type ScopedInstance = Omit & { 29 | dispose: () => void 30 | } 31 | 32 | function createScopedInstance(cb: () => T): ScopedInstance { 33 | return createRoot((dispose) => { 34 | const instance = cb() 35 | return { 36 | ...instance, 37 | dispose, 38 | } 39 | }) 40 | } 41 | 42 | let currentURL: string | undefined 43 | let translator: ScopedInstance | undefined 44 | let settingsInjector: ScopedInstance | undefined 45 | 46 | export async function start(translators: Translator[], settingsInjectors: SettingsInjector[]) { 47 | await storageReady 48 | 49 | async function onUpdate() { 50 | await new Promise(resolve => (queueMicrotask ?? 
setTimeout)(resolve)) 51 | 52 | if (currentURL !== location.href) { 53 | currentURL = location.href 54 | 55 | // there is a navigation in the page 56 | 57 | // update i18n element 58 | changeLangEl(document.documentElement as HTMLHtmlElement) 59 | 60 | // update translator 61 | // only if the translator needs to be updated 62 | if (translator?.canKeep?.(currentURL)) { 63 | translator.onURLChange?.(currentURL) 64 | } 65 | else { 66 | // unmount previous translator 67 | translator?.dispose() 68 | translator = undefined 69 | 70 | // check if the page is a image page 71 | const url = new URL(location.href) 72 | 73 | // find the first translator that matches the url 74 | const matched = translators.find(t => t.match(url)) 75 | if (matched) 76 | translator = createScopedInstance(matched.mount) 77 | } 78 | 79 | /* update settings page */ 80 | if (settingsInjector?.canKeep?.(currentURL)) { 81 | settingsInjector.onURLChange?.(currentURL) 82 | } 83 | else { 84 | // unmount previous settings injector 85 | settingsInjector?.dispose() 86 | settingsInjector = undefined 87 | 88 | // check if the page is a settings page 89 | const url = new URL(location.href) 90 | 91 | // find the first settings injector that matches the url 92 | const matched = settingsInjectors.find(t => t.match(url)) 93 | if (matched) 94 | settingsInjector = createScopedInstance(matched.mount) 95 | } 96 | } 97 | } 98 | 99 | if (window.onurlchange === null) { 100 | window.addEventListener('urlchange', onUpdate) 101 | 102 | // FIXME temporary fix for TM not firing urlchange event on hash change 103 | const pushState = history.pushState 104 | window.history.pushState = function () { 105 | // eslint-disable-next-line prefer-rest-params 106 | pushState.apply(this, arguments as any) 107 | // eslint-disable-next-line prefer-rest-params 108 | if (typeof arguments[2] === 'string' && arguments[2].startsWith('#')) 109 | onUpdate() 110 | } 111 | } 112 | else { 113 | const installObserver = new 
MutationObserver(throttle(onUpdate, 200)) 114 | installObserver.observe(document.body, { childList: true, subtree: true }) 115 | } 116 | onUpdate() 117 | } 118 | -------------------------------------------------------------------------------- /userscript/src/pixiv/settings.tsx: -------------------------------------------------------------------------------- 1 | import { onCleanup } from 'solid-js' 2 | import { render } from 'solid-js/web' 3 | import { tw } from '../utils/twind' 4 | import { t } from '../i18n' 5 | import type { SettingsInjector, SettingsInjectorInstance } from '../main' 6 | import { Settings } from '../settings' 7 | 8 | function mount(): SettingsInjectorInstance { 9 | const wrapper = document.getElementById('wrapper') 10 | if (!wrapper) 11 | return {} 12 | 13 | const adFooter = wrapper.querySelector('.ad-footer') 14 | if (!adFooter) 15 | return {} 16 | 17 | const settingsContainer = document.createElement('div') 18 | onCleanup(() => { 19 | settingsContainer.remove() 20 | }) 21 | 22 | const disposeSettings = render(() => ( 23 |
24 |

25 | {t('settings.title')()} 26 |

27 |
28 | 35 |
36 |
37 | ), settingsContainer) 38 | onCleanup(disposeSettings) 39 | 40 | wrapper.insertBefore(settingsContainer, adFooter) 41 | 42 | return {} 43 | } 44 | 45 | const settingsInjector: SettingsInjector = { 46 | match(url) { 47 | // https://www.pixiv.net/setting_user.php 48 | return url.hostname.endsWith('pixiv.net') && url.pathname.match(/\/setting_user\.php/) 49 | }, 50 | mount, 51 | } 52 | 53 | export default settingsInjector 54 | -------------------------------------------------------------------------------- /userscript/src/settings/index.tsx: -------------------------------------------------------------------------------- 1 | import type { Accessor, Component, JSX } from 'solid-js' 2 | import { For, Show } from 'solid-js' 3 | import { tw } from '../utils/twind' 4 | import { t } from '../i18n' 5 | import { 6 | detectionResolution, 7 | keepInstances, 8 | renderTextOrientation, 9 | scriptLang, 10 | setDetectionResolution, 11 | setKeepInstances, 12 | setRenderTextOrientation, 13 | setScriptLang, 14 | setTargetLang, 15 | setTextDetector, 16 | setTranslatorService, 17 | targetLang, 18 | textDetector, 19 | translatorService, 20 | } from '../utils/storage' 21 | 22 | type OptionsMap = Record> 23 | 24 | export const detectResOptionsMap = { 25 | S: () => '1024px', 26 | M: () => '1536px', 27 | L: () => '2048px', 28 | X: () => '2560px', 29 | } satisfies OptionsMap 30 | export const detectResOptions = Object.keys(detectResOptionsMap) 31 | export type DetectResOption = keyof typeof detectResOptionsMap 32 | 33 | export const renderTextDirOptionsMap = { 34 | auto: t('settings.render-text-orientation-options.auto'), 35 | h: t('settings.render-text-orientation-options.horizontal'), 36 | v: t('settings.render-text-orientation-options.vertical'), 37 | } satisfies OptionsMap 38 | export const renderTextDirOptions = Object.keys(renderTextDirOptionsMap) 39 | export type RenderTextDirOption = keyof typeof renderTextDirOptionsMap 40 | 41 | export const textDetectorOptionsMap = { 42 | 
default: t('settings.text-detector-options.default'), 43 | ctd: () => 'Comic Text Detector', 44 | } satisfies OptionsMap 45 | export const textDetectorOptions = Object.keys(textDetectorOptionsMap) 46 | export type TextDetectorOption = keyof typeof textDetectorOptionsMap 47 | 48 | export const translatorOptionsMap = { 49 | 'gpt3.5': () => 'GPT-3.5', 50 | 'youdao': () => 'Youdao', 51 | 'baidu': () => 'Baidu', 52 | 'google': () => 'Google', 53 | 'deepl': () => 'DeepL', 54 | 'papago': () => 'Papago', 55 | 'offline': () => 'Sugoi / NLLB', 56 | 'none': t('settings.translator-options.none'), 57 | } satisfies OptionsMap 58 | export const translatorOptions = Object.keys(translatorOptionsMap) 59 | export type TranslatorOption = keyof typeof translatorOptionsMap 60 | 61 | export const targetLangOptionsMap = { 62 | '': t('settings.target-language-options.auto'), 63 | 'CHS': () => '简体中文', 64 | 'CHT': () => '繁體中文', 65 | 'JPN': () => '日本語', 66 | 'ENG': () => 'English', 67 | 'KOR': () => '한국어', 68 | 'VIN': () => 'Tiếng Việt', 69 | 'CSY': () => 'čeština', 70 | 'NLD': () => 'Nederlands', 71 | 'FRA': () => 'français', 72 | 'DEU': () => 'Deutsch', 73 | 'HUN': () => 'magyar nyelv', 74 | 'ITA': () => 'italiano', 75 | 'PLK': () => 'polski', 76 | 'PTB': () => 'português', 77 | 'ROM': () => 'limba română', 78 | 'RUS': () => 'русский язык', 79 | 'UKR': () => 'українська мова', 80 | 'ESP': () => 'español', 81 | 'TRK': () => 'Türk dili', 82 | } satisfies OptionsMap 83 | export const targetLangOptions = Object.keys(targetLangOptionsMap) 84 | export type TargetLangOption = keyof typeof targetLangOptionsMap 85 | 86 | export const scriptLangOptionsMap = { 87 | '': t('settings.script-language-options.auto'), 88 | 'zh-CN': () => '简体中文', 89 | 'en-US': () => 'English', 90 | } satisfies OptionsMap 91 | export const scriptLangOptions = Object.keys(scriptLangOptionsMap) 92 | export type ScriptLangOption = keyof typeof scriptLangOptionsMap 93 | 94 | export const keepInstancesOptionsMap = { 95 | 
'until-reload': t('settings.keep-instances-options.until-reload'), 96 | 'until-navigate': t('settings.keep-instances-options.until-navigate'), 97 | } satisfies OptionsMap 98 | export const keepInstancesOptions = Object.keys(keepInstancesOptionsMap) 99 | export type KeepInstancesOption = keyof typeof keepInstancesOptionsMap 100 | 101 | export const Settings: Component<{ 102 | itemOrientation?: 'vertical' | 'horizontal' 103 | textStyle?: JSX.HTMLAttributes['style'] 104 | }> = (props) => { 105 | const itemOrientation = () => props.itemOrientation ?? 'vertical' 106 | const textStyle = () => props.textStyle ?? {} 107 | 108 | return ( 109 |
110 | {/* Meta */} 111 |
{EDITION} edition, v{VERSION}
112 | {/* Sponsor */} 113 |
114 | {t('sponsor.text')()} 115 |
116 |
117 | {([name, url]) => ( 122 | <> 123 | {' '} 124 | {name} 130 | 131 | )} 132 |
133 | {/* Settings */} 134 | {([title, opt, setOpt, optMap, desc]) => ( 171 |
172 |
{title()}
173 |
174 | 183 | 184 |
{desc()}
185 |
186 |
187 |
188 | )}
189 | {/* Reset */} 190 |
191 | 204 |
205 |
206 | ) 207 | } 208 | -------------------------------------------------------------------------------- /userscript/src/shims.d.ts: -------------------------------------------------------------------------------- 1 | /* eslint-disable @typescript-eslint/no-explicit-any */ 2 | 3 | declare module '*.yaml' { 4 | const data: any 5 | export default data 6 | } 7 | declare module '*.yml' { 8 | const data: any 9 | export default data 10 | } 11 | 12 | declare const GMP: typeof GM 13 | declare const VERSION: string 14 | declare const EDITION: 'regular' | 'nsfw' 15 | -------------------------------------------------------------------------------- /userscript/src/twitter/settings.tsx: -------------------------------------------------------------------------------- 1 | import { createMutationObserver } from '@solid-primitives/mutation-observer' 2 | import { throttle } from '@solid-primitives/scheduled' 3 | import { onCleanup } from 'solid-js' 4 | import { render } from 'solid-js/web' 5 | import { tw } from '../utils/twind' 6 | import { t } from '../i18n' 7 | import type { SettingsInjector, SettingsInjectorInstance } from '../main' 8 | import { Settings } from '../settings' 9 | 10 | function mount(): SettingsInjectorInstance { 11 | let settingsTab: HTMLElement | undefined 12 | let disposeText: (() => void) | undefined 13 | const checkTab = () => { 14 | const tablist = document.querySelector('[role="tablist"]') 15 | || document.querySelector('[data-testid="loggedOutPrivacySection"]') 16 | if (!tablist) { 17 | if (disposeText) { 18 | disposeText() 19 | disposeText = undefined 20 | } 21 | return 22 | } 23 | 24 | if (tablist.querySelector(`div[data-imgtrans-settings-${EDITION}]`)) 25 | return 26 | 27 | const inactiveRefrenceEl = Array.from(tablist.children) 28 | .find(el => el.children.length < 2 && el.querySelector('a')) 29 | if (!inactiveRefrenceEl) 30 | return 31 | 32 | settingsTab = inactiveRefrenceEl.cloneNode(true) as HTMLElement 33 | 
settingsTab.setAttribute(`data-imgtrans-settings-${EDITION}`, 'true') 34 | 35 | const textEl = settingsTab.querySelector('span') 36 | if (textEl) { 37 | while (textEl.firstChild) 38 | textEl.removeChild(textEl.firstChild) 39 | disposeText = render(() => t('settings.title')(), textEl) 40 | onCleanup(disposeText) 41 | } 42 | 43 | const linkEl = settingsTab.querySelector('a') 44 | if (linkEl) 45 | linkEl.href = `/settings/__imgtrans_${EDITION}` 46 | 47 | tablist.appendChild(settingsTab) 48 | } 49 | 50 | let disposeSettings: (() => void) | undefined 51 | const checkSettings = () => { 52 | const section = document.querySelector('[data-testid="error-detail"]') 53 | ?.parentElement?.parentElement as HTMLElement | null 54 | if (!section?.querySelector(`[data-imgtrans-settings-${EDITION}-section]`)) { 55 | if (disposeSettings) { 56 | disposeSettings() 57 | disposeSettings = undefined 58 | } 59 | if (!section) 60 | return 61 | } 62 | 63 | const title = `${t('settings.title')()} / Twitter` 64 | if (document.title !== title) 65 | document.title = title 66 | 67 | if (disposeSettings) 68 | return 69 | 70 | const errorPage = section.firstChild! as HTMLElement 71 | errorPage.style.display = 'none' 72 | 73 | const settingsContainer = document.createElement('div') 74 | settingsContainer.setAttribute(`data-imgtrans-settings-${EDITION}-section`, 'true') 75 | section.appendChild(settingsContainer) 76 | const disposeSettingsApp = render(() => { 77 | onCleanup(() => { 78 | errorPage.style.display = '' 79 | }) 80 | 81 | return ( 82 | // r-37j5jr: twitter font 83 |
84 |
85 |

86 | {t('settings.title')()} 87 |

88 |
89 | 90 |
91 | ) 92 | }, settingsContainer) 93 | disposeSettings = () => { 94 | disposeSettingsApp() 95 | settingsContainer.remove() 96 | } 97 | onCleanup(disposeSettings) 98 | } 99 | 100 | createMutationObserver( 101 | document.body, 102 | { childList: true, subtree: true }, 103 | throttle(() => { 104 | // since this throttled fn can be called after page navigation, 105 | // we need to check if the page is still the settings page. 106 | if (!location.pathname.startsWith('/settings')) 107 | return 108 | 109 | // workaround for profile editing popup 110 | if (location.pathname === '/settings/profile') 111 | return 112 | 113 | checkTab() 114 | 115 | if (location.pathname.match(`/settings/__imgtrans_${EDITION}`)) { 116 | if (settingsTab && settingsTab.children.length < 2) { 117 | settingsTab.style.backgroundColor = '#F7F9F9' 118 | const activeIndicator = document.createElement('div') 119 | activeIndicator.className = tw('absolute z-10 inset-0 border-y-0 border-l-0 border-r-2 border-solid border-[#1D9Bf0] pointer-events-none') 120 | settingsTab.appendChild(activeIndicator) 121 | } 122 | checkSettings() 123 | } 124 | else { 125 | if (settingsTab && settingsTab.children.length > 1) { 126 | settingsTab.style.backgroundColor = '' 127 | settingsTab.removeChild(settingsTab.lastChild!) 
128 | } 129 | if (disposeSettings) { 130 | disposeSettings() 131 | disposeSettings = undefined 132 | } 133 | } 134 | }, 200), 135 | ) 136 | 137 | return { 138 | canKeep(url) { 139 | return url.includes('twitter.com') && url.includes('/settings') 140 | }, 141 | } 142 | } 143 | 144 | const settingsInjector: SettingsInjector = { 145 | match(url) { 146 | // https://twitter.com/settings/ 147 | return url.hostname.endsWith('twitter.com') 148 | && (url.pathname === '/settings' || url.pathname.match(/^\/settings\//)) 149 | && url.pathname !== '/settings/profile' 150 | }, 151 | mount, 152 | } 153 | 154 | export default settingsInjector 155 | -------------------------------------------------------------------------------- /userscript/src/utils/core.ts: -------------------------------------------------------------------------------- 1 | import type { Accessor } from 'solid-js' 2 | import { BCP47ToISO639, realLang, t } from '../i18n' 3 | import { 4 | detectionResolution, 5 | renderTextOrientation, 6 | targetLang, 7 | textDetector, 8 | translatorService, 9 | } from './storage' 10 | import { formatProgress } from '.' 11 | 12 | export async function resizeToSubmit(blob: Blob, suffix: string): Promise<{ blob: Blob; suffix: string }> { 13 | const blobUrl = URL.createObjectURL(blob) 14 | const img = await new Promise((resolve, reject) => { 15 | const img = new Image() 16 | img.onload = () => resolve(img) 17 | img.onerror = err => reject(err) 18 | img.src = blobUrl 19 | }) 20 | URL.revokeObjectURL(blobUrl) 21 | 22 | const w = img.width 23 | const h = img.height 24 | 25 | if (w <= 4096 && h <= 4096) 26 | return { blob, suffix } 27 | 28 | // resize to less than 4k 29 | const scale = Math.min(4096 / w, 4096 / h) 30 | const width = Math.floor(w * scale) 31 | const height = Math.floor(h * scale) 32 | 33 | const canvas = document.createElement('canvas') 34 | canvas.width = width 35 | canvas.height = height 36 | 37 | const ctx = canvas.getContext('2d')! 
38 | ctx.imageSmoothingQuality = 'high' 39 | ctx.drawImage(img, 0, 0, width, height) 40 | 41 | const newBlob = await new Promise((resolve, reject) => { 42 | canvas.toBlob((blob) => { 43 | if (blob) 44 | resolve(blob) 45 | else 46 | reject(new Error('Canvas toBlob failed')) 47 | }, 'image/png') 48 | }) 49 | 50 | // console.log(`resized from ${w}x${h}(${formatSize(blob.size)},${suffix}) to ${width}x${height}(${formatSize(newBlob.size)},png)`) 51 | 52 | return { 53 | blob: newBlob, 54 | suffix: 'png', 55 | } 56 | } 57 | 58 | export interface TaskResult { 59 | translation_mask: string 60 | } 61 | 62 | export interface TranslateOptionsOverwrite { 63 | detectionResolution?: string 64 | renderTextOrientation?: string 65 | textDetector?: string 66 | translator?: string 67 | forceRetry?: boolean 68 | } 69 | export async function submitTranslate( 70 | blob: Blob, 71 | suffix: string, 72 | listeners: { 73 | onProgress?: (progress: string) => void 74 | onFinal?: () => void 75 | } = {}, 76 | optionsOverwrite?: TranslateOptionsOverwrite, 77 | ): Promise<{ 78 | id: string 79 | status: string 80 | result?: TaskResult 81 | }> { 82 | const { onProgress, onFinal } = listeners 83 | 84 | const formData = new FormData() 85 | formData.append('file', blob, `image.${suffix}`) 86 | formData.append('target_language', targetLang() || BCP47ToISO639(realLang())) 87 | formData.append('detector', optionsOverwrite?.textDetector ?? textDetector()) 88 | formData.append('direction', optionsOverwrite?.renderTextOrientation ?? renderTextOrientation()) 89 | formData.append('translator', optionsOverwrite?.translator ?? translatorService()) 90 | formData.append('size', optionsOverwrite?.detectionResolution ?? detectionResolution()) 91 | formData.append('retry', optionsOverwrite?.forceRetry ? 
'true' : 'false') 92 | 93 | const result = await GMP.xmlHttpRequest({ 94 | method: 'POST', 95 | url: 'https://api.cotrans.touhou.ai/task/upload/v1', 96 | // @ts-expect-error FormData is supported 97 | data: formData, 98 | upload: { 99 | onprogress: onProgress || onFinal 100 | ? (e: ProgressEvent) => { 101 | if (e.lengthComputable) { 102 | if (e.loaded >= e.total - 16) { 103 | onFinal?.() 104 | } 105 | else { 106 | const p = formatProgress(e.loaded, e.total) 107 | onProgress?.(p) 108 | } 109 | } 110 | } 111 | : undefined, 112 | }, 113 | }) 114 | 115 | // console.log(result.responseText) 116 | return JSON.parse(result.responseText) 117 | } 118 | 119 | export function getStatusText(msg: QueryV1Message): Accessor { 120 | if (msg.type === 'pending') 121 | return t('common.status.pending-pos', { pos: msg.pos }) 122 | if (msg.type === 'status') 123 | return t(`common.status.${msg.status}`) 124 | return t('common.status.default') 125 | } 126 | 127 | type QueryV1Message = { 128 | type: 'pending' 129 | pos: number 130 | } | { 131 | type: 'status' 132 | status: string 133 | } | { 134 | type: 'result' 135 | result: { 136 | translation_mask: string 137 | } 138 | } | { 139 | type: 'error' 140 | error_id?: string 141 | } | { 142 | type: 'not_found' 143 | } 144 | 145 | export function pullTranslationStatus(id: string, cb: (status: Accessor) => void) { 146 | const ws = new WebSocket(`wss://api.cotrans.touhou.ai/task/${id}/event/v1`) 147 | 148 | return new Promise((resolve, reject) => { 149 | ws.onmessage = (e) => { 150 | const msg = JSON.parse(e.data) as QueryV1Message 151 | if (msg.type === 'result') 152 | resolve(msg.result) 153 | else if (msg.type === 'error') 154 | reject(t('common.status.error-with-id', { id: msg.error_id })) 155 | else 156 | cb(getStatusText(msg)) 157 | } 158 | }) 159 | } 160 | 161 | export async function pullTranslationStatusPolling(id: string, cb: (status: Accessor) => void) { 162 | while (true) { 163 | const res = await GMP.xmlHttpRequest({ 164 | method: 
'GET', 165 | url: `https://api.cotrans.touhou.ai/task/${id}/status/v1`, 166 | }) 167 | const msg = JSON.parse(res.responseText) as QueryV1Message 168 | if (msg.type === 'result') 169 | return msg.result 170 | else if (msg.type === 'error') 171 | throw t('common.status.error-with-id', { id: msg.error_id }) 172 | else 173 | cb(getStatusText(msg)) 174 | 175 | await new Promise(resolve => setTimeout(resolve, 1000)) 176 | } 177 | } 178 | 179 | export async function downloadBlob( 180 | url: string, 181 | listeners: { 182 | onProgress?: (progress: string) => void 183 | } = {}, 184 | ): Promise { 185 | const { onProgress } = listeners 186 | 187 | const res = await GMP.xmlHttpRequest({ 188 | method: 'GET', 189 | responseType: 'blob', 190 | url, 191 | onprogress: onProgress 192 | ? (e) => { 193 | if (e.lengthComputable) { 194 | const p = formatProgress(e.loaded, e.total) 195 | onProgress(p) 196 | } 197 | } 198 | : undefined, 199 | }) 200 | 201 | return res.response as Blob 202 | } 203 | 204 | export async function blobToImageData(blob: Blob): Promise { 205 | const blobUrl = URL.createObjectURL(blob) 206 | 207 | const img = await new Promise((resolve, reject) => { 208 | const img = new Image() 209 | img.onload = () => resolve(img) 210 | img.onerror = err => reject(err) 211 | img.src = blobUrl 212 | }) 213 | URL.revokeObjectURL(blobUrl) 214 | 215 | const w = img.width 216 | const h = img.height 217 | 218 | const canvas = document.createElement('canvas') 219 | canvas.width = w 220 | canvas.height = h 221 | 222 | const ctx = canvas.getContext('2d')! 223 | ctx.drawImage(img, 0, 0) 224 | return ctx.getImageData(0, 0, w, h) 225 | } 226 | 227 | export async function imageDataToBlob(imageData: ImageData): Promise { 228 | const canvas = document.createElement('canvas') 229 | canvas.width = imageData.width 230 | canvas.height = imageData.height 231 | const ctx = canvas.getContext('2d')! 
232 | ctx.putImageData(imageData, 0, 0) 233 | 234 | const blob = await new Promise((resolve, reject) => { 235 | canvas.toBlob((blob) => { 236 | if (blob) 237 | resolve(blob) 238 | else 239 | reject(new Error('Canvas toBlob failed')) 240 | }, 'image/png') 241 | }) 242 | 243 | return blob 244 | } 245 | -------------------------------------------------------------------------------- /userscript/src/utils/index.ts: -------------------------------------------------------------------------------- 1 | const mimeMap: Record = { 2 | png: 'image/png', 3 | jpg: 'image/jpeg', 4 | gif: 'image/gif', 5 | webp: 'image/webp', 6 | } 7 | export function suffixToMime(suffix: string) { 8 | return mimeMap[suffix] 9 | } 10 | 11 | export function formatSize(bytes: number) { 12 | const k = 1024 13 | const sizes = ['B', 'KB', 'MB', 'GB', 'TB'] 14 | if (bytes === 0) 15 | return '0B' 16 | const i = Math.floor(Math.log(bytes) / Math.log(k)) 17 | return `${(bytes / k ** i).toFixed(2)}${sizes[i]}` 18 | } 19 | export function formatProgress(loaded: number, total: number) { 20 | return `${formatSize(loaded)}/${formatSize(total)}` 21 | } 22 | 23 | export function assert(condition: unknown, message?: string): asserts condition { 24 | if (!condition) 25 | throw new Error(message) 26 | } 27 | -------------------------------------------------------------------------------- /userscript/src/utils/storage.ts: -------------------------------------------------------------------------------- 1 | import type { Accessor, Setter } from 'solid-js' 2 | import { createEffect, createSignal, on, onCleanup } from 'solid-js' 3 | import type { 4 | DetectResOption, 5 | KeepInstancesOption, 6 | RenderTextDirOption, 7 | ScriptLangOption, 8 | TargetLangOption, 9 | TextDetectorOption, 10 | TranslatorOption, 11 | } from '../settings' 12 | 13 | export type GMSignal = [ 14 | Accessor & { 15 | ready: Promise 16 | isReady: Accessor 17 | }, 18 | Setter, 19 | ] 20 | 21 | export function createGMSignal(key: string): GMSignal 22 | 
export function createGMSignal(key: string, initialValue: T): GMSignal 23 | export function createGMSignal(key: string, initialValue?: T) { 24 | const [signal, setSignal] = createSignal(initialValue) as GMSignal 25 | 26 | let listener: number | undefined 27 | 28 | Promise.resolve() 29 | .then(() => GMP.addValueChangeListener?.(key, (name, oldValue, newValue, remote) => { 30 | if (name === key && (remote === undefined || remote === true)) 31 | read(newValue) 32 | })) 33 | .then(l => listener = l) 34 | 35 | let effectPaused = false 36 | createEffect(on(signal, () => { 37 | if (effectPaused) 38 | return 39 | if (signal() == null) { 40 | GMP.deleteValue(key) 41 | effectPaused = true 42 | setSignal(() => initialValue) 43 | effectPaused = false 44 | } 45 | else { 46 | GMP.setValue(key, signal()) 47 | } 48 | }, { defer: true })) 49 | 50 | async function read(newValue?: string) { 51 | effectPaused = true 52 | 53 | const rawValue = newValue ?? (await GMP.getValue(key)) 54 | if (rawValue == null) 55 | setSignal(() => initialValue) 56 | else 57 | setSignal(() => rawValue as T) 58 | 59 | effectPaused = false 60 | } 61 | 62 | const [isReady, setIsReady] = createSignal(false) 63 | signal.isReady = isReady 64 | signal.ready = read() 65 | .then(() => { 66 | setIsReady(true) 67 | }) 68 | 69 | onCleanup(() => { 70 | if (listener) 71 | GMP.removeValueChangeListener?.(listener) 72 | }) 73 | 74 | return [signal, setSignal] 75 | } 76 | 77 | export const [detectionResolution, setDetectionResolution] = createGMSignal('detectionResolution', 'M') 78 | export const [textDetector, setTextDetector] = createGMSignal('textDetector', 'default') 79 | export const [translatorService, setTranslatorService] = createGMSignal('translator', 'gpt3.5') 80 | export const [renderTextOrientation, setRenderTextOrientation] = createGMSignal('renderTextOrientation', 'auto') 81 | export const [targetLang, setTargetLang] = createGMSignal('targetLang', '') 82 | export const [scriptLang, setScriptLang] = 
createGMSignal('scriptLanguage', '') 83 | export const [keepInstances, setKeepInstances] = createGMSignal('keepInstances', 'until-reload') 84 | 85 | export const storageReady = Promise.all([ 86 | detectionResolution.ready, 87 | textDetector.ready, 88 | translatorService.ready, 89 | renderTextOrientation.ready, 90 | targetLang.ready, 91 | scriptLang.ready, 92 | keepInstances.ready, 93 | ]) 94 | -------------------------------------------------------------------------------- /userscript/src/utils/twind.ts: -------------------------------------------------------------------------------- 1 | import { dom, twind } from '@twind/core' 2 | import presetAutoprefix from '@twind/preset-autoprefix' 3 | import presetTailwind from '@twind/preset-tailwind' 4 | 5 | export const tw = twind({ 6 | preflight: false, 7 | hash: (className, defaultHash) => { 8 | return `tw-${defaultHash(className).slice(1)}` 9 | }, 10 | presets: [ 11 | presetAutoprefix(), 12 | presetTailwind({ 13 | disablePreflight: true, 14 | }), 15 | ], 16 | }, dom()) 17 | -------------------------------------------------------------------------------- /userscript/tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "compilerOptions": { 3 | "target": "ES2020", 4 | "useDefineForClassFields": true, 5 | "module": "ESNext", 6 | "lib": ["ESNext", "DOM"], 7 | "types": ["tampermonkey", "vitest", "unplugin-icons/types/solid"], 8 | "moduleResolution": "Node", 9 | "jsx": "preserve", 10 | "jsxImportSource": "solid-js", 11 | "strict": true, 12 | "resolveJsonModule": true, 13 | "esModuleInterop": true, 14 | "noEmit": true, 15 | "noImplicitReturns": true 16 | }, 17 | "include": ["./src"] 18 | } 19 | -------------------------------------------------------------------------------- /userscript/vitest.config.ts: -------------------------------------------------------------------------------- 1 | export default { 2 | test: { 3 | environment: 'happy-dom', 4 | globals: true, 5 | // 
segment fault, idk 6 | threads: false, 7 | }, 8 | } 9 | -------------------------------------------------------------------------------- /web/.gitignore: -------------------------------------------------------------------------------- 1 | node_modules 2 | *.log* 3 | .nuxt 4 | .nitro 5 | .cache 6 | .output 7 | .env 8 | dist 9 | -------------------------------------------------------------------------------- /web/app.vue: -------------------------------------------------------------------------------- 1 | 7 | -------------------------------------------------------------------------------- /web/components/footer/index.vue: -------------------------------------------------------------------------------- 1 | 29 | 30 | 89 | -------------------------------------------------------------------------------- /web/components/nav/index.vue: -------------------------------------------------------------------------------- 1 | 4 | 5 | 33 | -------------------------------------------------------------------------------- /web/components/u/Listbox.vue: -------------------------------------------------------------------------------- 1 | 32 | 33 | 103 | -------------------------------------------------------------------------------- /web/layouts/default.vue: -------------------------------------------------------------------------------- 1 | 3 | 4 | 13 | 14 | 22 | -------------------------------------------------------------------------------- /web/nuxt.config.ts: -------------------------------------------------------------------------------- 1 | // https://v3.nuxtjs.org/api/configuration/nuxt.config 2 | export default defineNuxtConfig({ 3 | ssr: false, 4 | 5 | modules: [ 6 | '@vueuse/nuxt', 7 | '@unocss/nuxt', 8 | 'nuxt-headlessui', 9 | ], 10 | 11 | typescript: { 12 | strict: true, 13 | }, 14 | 15 | runtimeConfig: { 16 | public: { 17 | apiBase: 'https://api.cotrans.touhou.ai', 18 | wsBase: 'wss://api.cotrans.touhou.ai', 19 | }, 20 | }, 21 | 22 | unocss: { 23 | preflight: true, 24 | 
uno: true, 25 | icons: { 26 | scale: 1.2, 27 | extraProperties: { 28 | 'color': 'inherit', 29 | // Avoid crushing of icons in crowded situations 30 | 'min-width': '1.2em', 31 | }, 32 | }, 33 | webFonts: { 34 | provider: 'google', 35 | fonts: { 36 | quicksand: 'Quicksand:300,400,500,600,700', 37 | }, 38 | }, 39 | shortcuts: [ 40 | [ 41 | 'nav-link', 42 | [ 43 | 'absolute', 44 | 'content-empty', 45 | 'left-0', 46 | 'bottom-0', 47 | 'w-full', 48 | 'h-px', 49 | 'opacity-0', 50 | 'bg-gradient-to-r', 51 | 'from-fuchsia-600', 52 | 'to-pink-600', 53 | 'transform', 54 | '-translate-y-1', 55 | 'transition-all', 56 | 'ease-out', 57 | 'hover:opacity-60', 58 | 'hover:translate-y-0', 59 | ] 60 | .map(c => `after:${c}`) 61 | .concat([ 62 | 'relative', 63 | ]) 64 | .join(' '), 65 | ], 66 | ], 67 | }, 68 | 69 | headlessui: { 70 | prefix: 'H', 71 | }, 72 | }) 73 | -------------------------------------------------------------------------------- /web/package.json: -------------------------------------------------------------------------------- 1 | { 2 | "private": true, 3 | "scripts": { 4 | "build": "nuxt build", 5 | "dev": "nuxt dev", 6 | "generate": "nuxt generate", 7 | "preview": "nuxt preview", 8 | "postinstall": "nuxt prepare" 9 | }, 10 | "devDependencies": { 11 | "@iconify-json/ri": "^1.1.10", 12 | "@unocss/nuxt": "^0.53.6", 13 | "@vueuse/core": "^10.2.1", 14 | "@vueuse/nuxt": "^10.2.1", 15 | "nuxt": "^3.6.5", 16 | "nuxt-headlessui": "^1.1.4" 17 | } 18 | } 19 | -------------------------------------------------------------------------------- /web/pages/userscript.vue: -------------------------------------------------------------------------------- 1 | 4 | 5 | 10 | -------------------------------------------------------------------------------- /web/tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | // https://v3.nuxtjs.org/concepts/typescript 3 | "extends": "./.nuxt/tsconfig.json" 4 | } 5 | 
-------------------------------------------------------------------------------- /wk-gateway/.gitignore: --------------------------------------------------------------------------------
/dist/
-------------------------------------------------------------------------------- /wk-gateway/buf.gen.yaml: --------------------------------------------------------------------------------
# Learn more: https://docs.buf.build/configuration/v1/buf-gen-yaml
version: v1
plugins:
  - plugin: es
    opt: target=ts
    out: src/protoGen
-------------------------------------------------------------------------------- /wk-gateway/build.config.ts: --------------------------------------------------------------------------------
import { defineBuildConfig } from 'unbuild'
import { version } from './package.json'
import { dbEnum } from './src/db'

// Flattens a nested object into dot-separated keys whose values are the
// JSON-stringified leaves, suitable for rollup's `replace` option.
// Functions are descended into on purpose: dbEnum members are callable
// objects carrying the enum values as enumerable own properties.
function flattenObject(
  obj: Record<string, unknown>,
  parentKey = '',
  result: Record<string, string> = {},
) {
  for (const key of Object.keys(obj)) {
    const value = obj[key]
    const flatKey = parentKey ? `${parentKey}.${key}` : key
    const isNested = (typeof value === 'object' && value !== null)
      || typeof value === 'function'
    if (isNested)
      flattenObject(value as Record<string, unknown>, flatKey, result)
    else
      result[flatKey] = JSON.stringify(value)
  }
  return result
}

export default defineBuildConfig({
  entries: [
    { input: 'src/index.ts', name: 'index' },
    { input: 'src/mitWorker/dObject.ts', name: 'doMitWorker' },
  ],
  declaration: true,
  replace: {
    'import.meta.env.VERSION': JSON.stringify(version),
    'import.meta.env.BUILD_TIME': JSON.stringify(new Date().toISOString()),
    ...flattenObject(dbEnum, 'dbEnum'),
  },
  rollup: {
    inlineDependencies: true,
    resolve: {
      exportConditions: ['browser'],
    },
  },
  hooks: {
    // Bundle everything into the worker output, but restore the externals
    // for the .d.ts build so type generation is not slowed down.
    'rollup:options': (ctx, opt) => {
      const external = opt.external
      opt.external = []
      ctx.hooks.hook('rollup:dts:options', (ctx, opt) => {
        opt.external = external
      })
    },
  },
})
-------------------------------------------------------------------------------- /wk-gateway/package.json: --------------------------------------------------------------------------------
{
  "version": "0.1.0",
  "private": true,
  "main": "dist/index.mjs",
  "types": "dist/index.d.ts",
  "scripts": {
    "build": "unbuild",
    "postinstall": "rimraf src/protoGen && buf generate ../proto"
  },
  "dependencies": {
    "@bufbuild/protobuf": "^1.3.0",
    "@paralleldrive/cuid2": "^2.2.1",
    "hono": "^3.3.2",
    "jose": "^4.14.4",
    "ofetch": "^1.1.1",
    "zod": "^3.21.4"
  },
  "devDependencies": {
    "@bufbuild/buf": "^1.25.0",
    "@bufbuild/protoc-gen-es": "^1.3.0",
    "@cloudflare/workers-types": "^4.20230717.1",
    "@cotrans/types": "workspace:^",
    "@types/node": "^20.4.4",
    "rimraf": "^5.0.1",
    "unbuild": "^1.2.1"
  }
}
-------------------------------------------------------------------------------- /wk-gateway/shims.d.ts: -------------------------------------------------------------------------------- 1 | interface ImportMeta { 2 | env: ImportMetaEnv 3 | } 4 | 5 | interface ImportMetaEnv { 6 | VERSION: string 7 | BUILD_TIME: string 8 | } 9 | -------------------------------------------------------------------------------- /wk-gateway/src/db.ts: -------------------------------------------------------------------------------- 1 | /** 2 | * @example 3 | * const en = createEnum(['!removed', '~deprecated', 'normal']) 4 | * en.removed // never 5 | * en.deprecated // never 6 | * en.normal // 3 7 | * en(number) // 'normal' | 'deprecated' 8 | * type Union = keyof typeof en // 'normal' 9 | * type UnionDeprecated = ReturnType // 'normal' | 'deprecated' 10 | */ 11 | function createEnum< 12 | const T extends readonly string[], 13 | K extends T[number], 14 | U extends Range, 15 | >(values: T): 16 | & { [I in U as Exclude]: PlusOne } 17 | & ((i: number) => K extends `~${infer S}` ? S : Exclude) { 18 | const reverse = values.map(v => v[0] === '!' ? undefined : v[0] === '~' ? v.slice(1) : v) 19 | return Object.assign( 20 | (i: number) => reverse[i - 1], 21 | Object.fromEntries( 22 | values 23 | .filter(v => v[0] !== '~' && v[0] !== '!') 24 | .map((v, i) => [v, i + 1]), 25 | ), 26 | ) as never 27 | } 28 | type Range = 29 | C['length'] extends N ? I : Range 30 | type PlusOne = 31 | B['length'] extends N ? 
C['length'] : PlusOne 32 | 33 | export const dbEnum = { 34 | taskState: createEnum(['pending', 'running', 'done', 'error']), 35 | taskLanguage: createEnum(['CHS', 'CHT', 'CSY', 'NLD', 'ENG', 'FRA', 'DEU', 'HUN', 'ITA', 'JPN', 'KOR', 'PLK', 'PTB', 'ROM', 'RUS', 'ESP', 'TRK', 'UKR', 'VIN']), 36 | taskDetector: createEnum(['default', 'ctd']), 37 | taskDirection: createEnum(['auto', 'h', 'v']), 38 | taskTranslator: createEnum(['gpt3.5', 'youdao', 'baidu', 'google', 'deepl', 'papago', 'offline', 'none', 'original']), 39 | taskSize: createEnum(['S', 'M', 'L', 'X']), 40 | } 41 | -------------------------------------------------------------------------------- /wk-gateway/src/index.ts: -------------------------------------------------------------------------------- 1 | import { Hono } from 'hono' 2 | import { cors } from 'hono/cors' 3 | import { HTTPException } from 'hono/http-exception' 4 | import { ofetch } from 'ofetch' 5 | import type { Bindings } from './types' 6 | import { taskApp } from './task' 7 | import { mitWorkerApp } from './mitWorker' 8 | 9 | const CORS_ORIGINS: (string | RegExp)[] = [ 10 | /https?:\/\/localhost(?::\d+)?/, 11 | 'https://cotrans.touhou.ai', 12 | ] 13 | 14 | const app = new Hono<{ Bindings: Bindings }>() 15 | .use('*', cors({ 16 | origin: origin => 17 | CORS_ORIGINS.some( 18 | o => typeof o === 'string' 19 | ? o === origin 20 | : o.test(origin), 21 | ) 22 | ? 
origin 23 | : null, 24 | allowMethods: ['GET', 'POST', 'PUT', 'PATCH', 'DELETE', 'OPTIONS'], 25 | maxAge: 10 * 60, 26 | })) 27 | .get('/', ({ text }) => text(`Cotrans API by VoileLabs ${import.meta.env.VERSION}`)) 28 | .get('/status/v1', async ({ env, json }) => { 29 | const mitWorkerId = env.doMitWorker.idFromName('default') 30 | const mitWorker = await ofetch('https://fake-host/status', { 31 | fetcher: env.doMitWorker.get(mitWorkerId, { locationHint: 'enam' }), 32 | }) 33 | return json({ 34 | version: import.meta.env.VERSION, 35 | build_time: import.meta.env.BUILD_TIME, 36 | mit_worker: mitWorker, 37 | }) 38 | }) 39 | .route('/task', taskApp) 40 | .route('/mit', mitWorkerApp) 41 | .onError((err) => { 42 | if (err instanceof HTTPException) { 43 | // get the custom response 44 | return err.getResponse() 45 | } 46 | 47 | console.error(String(err instanceof Error ? (err.stack ?? err) : err)) 48 | 49 | // return a generic response 50 | return new Response('Internal Server Error', { status: 500 }) 51 | }) 52 | 53 | export default app 54 | -------------------------------------------------------------------------------- /wk-gateway/src/mitWorker/id.ts: -------------------------------------------------------------------------------- 1 | // k-sortable time based id generator 2 | // with some help from ChatGPT, obviously 3 | 4 | import { memo } from '../utils' 5 | 6 | const characters = '0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz' 7 | 8 | function convertToBase62(num: number) { 9 | let result = '' 10 | do { 11 | result = characters[num % 62] + result 12 | num = Math.floor(num / 62) 13 | } while (num > 0) 14 | return result 15 | } 16 | 17 | let sequenceNumber = 0 18 | 19 | const machineId = memo(() => { 20 | // Generating a unique random machine identifier using crypto.getRandomValues 21 | const array = new Uint8Array(3) 22 | crypto.getRandomValues(array) 23 | return Array.from(array).map(b => (`0${b.toString(16)}`).slice(-2)).join('') 24 | }) 25 | 26 | 
export function createSortableId() {
  const timestamp = new Date().getTime()

  // Increment sequence number and reset if it's too large
  sequenceNumber = (sequenceNumber + 1) & 0xFFFFFF

  const base62Timestamp = convertToBase62(timestamp)
  // NOTE(review): the sequence can reach 0xFFFFFF, which needs 4 base62
  // digits; padStart(2) therefore yields variable-length ids within one
  // millisecond, weakening k-sortability. Confirm whether padStart(4) was
  // intended before changing the id format.
  const base62Sequence = convertToBase62(sequenceNumber).padStart(2, '0')

  // Combine timestamp, machineId, and sequenceNumber
  return base62Timestamp + machineId() + base62Sequence
}
-------------------------------------------------------------------------------- /wk-gateway/src/mitWorker/index.ts: --------------------------------------------------------------------------------
import { Hono } from 'hono'
import type { Bindings } from '../types'

export const mitWorkerApp = new Hono<{ Bindings: Bindings }>()
  // Authenticated WebSocket endpoint for translation workers; forwards the
  // upgrade request to the singleton DOMitWorker durable object.
  .get('/worker_ws', async ({ env, req }) => {
    if (req.header('Upgrade') !== 'websocket')
      return new Response('Not a websocket request', { status: 400 })

    const encoder = new TextEncoder()
    if (!req.header('x-secret'))
      return new Response('Forbidden', { status: 403 })

    const provided = encoder.encode(req.header('x-secret')!)
    const expected = encoder.encode(env.MIT_WORKERS_SECRET)
    // BUG FIX: timingSafeEqual throws (rather than returning false) when the
    // buffers differ in length, which surfaced a wrong-length secret as a
    // 500 instead of a 403.
    if (provided.byteLength !== expected.byteLength)
      return new Response('Forbidden', { status: 403 })
    // @ts-expect-error Cloudflare only
    if (!crypto.subtle.timingSafeEqual(provided, expected))
      return new Response('Forbidden', { status: 403 })

    // pass the request to durable object
    const id = env.doMitWorker.idFromName('default')
    return env.doMitWorker.get(id, { locationHint: 'enam' })
      .fetch('https://fake-host/worker_ws', req.raw)
      .then(res => new Response(res.body, res))
  })
-------------------------------------------------------------------------------- /wk-gateway/src/mitWorker/ttl.ts: --------------------------------------------------------------------------------
// A Set whose members expire `ttl` milliseconds after insertion. Expired
// entries are hidden from has()/iteration immediately and physically purged
// lazily during add().
export class TTLSet<T> implements Set<T> {
  private map: Map<T, number> = new Map()
  private generatorPair: () => IterableIterator<[T, T]>
  private generator: () => IterableIterator<T>
  // timestamp of the last lazy purge performed in add()
  private lastCleanedAt = Date.now()

  constructor(public ttl: number) {
    const map = this.map
    this.generatorPair = function* (): IterableIterator<[T, T]> {
      const cutoff = Date.now() - ttl
      for (const [key, addedAt] of map.entries()) {
        if (addedAt > cutoff)
          yield [key, key]
      }
    }
    this.generator = function* (): IterableIterator<T> {
      const cutoff = Date.now() - ttl
      for (const [key, addedAt] of map.entries()) {
        if (addedAt > cutoff)
          yield key
      }
    }
  }

  add(value: T): this {
    const now = Date.now()

    // Lazily purge expired entries at most once per ttl window so the
    // backing map does not grow without bound.
    if (now - this.lastCleanedAt > this.ttl) {
      this.lastCleanedAt = now
      for (const [key, addedAt] of this.map.entries()) {
        // BUG FIX: the loop variable previously shadowed the outer `t`
        // (now), so the condition read `t + this.ttl < t`, which is always
        // false for a positive ttl — expired entries were never deleted.
        if (addedAt + this.ttl < now)
          this.map.delete(key)
      }
    }

    this.map.set(value, now)
    return this
  }

  clear(): void {
    this.map.clear()
  }

  delete(value: T): boolean {
    return this.map.delete(value)
  }

  // NOTE(review): iterates expired entries too (unlike has()/iterators),
  // matching the original behavior — confirm whether filtering was intended.
  forEach(callbackfn: (value: T, value2: T, set: Set<T>) => void, thisArg?: any): void {
    this.map.forEach((_, key) => callbackfn(key, key, this), thisArg)
  }

  has(value: T): boolean {
    return (this.map.get(value) ??
0) + this.ttl > Date.now() 54 | } 55 | 56 | get size(): number { 57 | return this.map.size 58 | } 59 | 60 | [Symbol.iterator](): IterableIterator { 61 | return this.generator() 62 | } 63 | 64 | entries(): IterableIterator<[T, T]> { 65 | return this.generatorPair() 66 | } 67 | 68 | keys(): IterableIterator { 69 | return this.generator() 70 | } 71 | 72 | values(): IterableIterator { 73 | return this.generator() 74 | } 75 | 76 | [Symbol.toStringTag] = 'TTLSet' 77 | } 78 | -------------------------------------------------------------------------------- /wk-gateway/src/task/index.ts: -------------------------------------------------------------------------------- 1 | import { Hono } from 'hono' 2 | import { ofetch } from 'ofetch' 3 | import type { QueryV1Message, QueryV1MessageNotFound } from '@cotrans/types' 4 | import type { Bindings } from '../types' 5 | import { dbEnum } from '../db' 6 | import { BLANK_PNG } from '../utils' 7 | import { upload } from './upload' 8 | 9 | export const taskApp = new Hono<{ Bindings: Bindings }>() 10 | .post('/upload/v1', upload) 11 | .put('/upload/v1', upload) 12 | .get('/group/:group/event/v1', async ({ env, req }) => { 13 | const group = req.param('group') 14 | 15 | if (req.header('Upgrade') !== 'websocket') 16 | throw new Error('Not a websocket request') 17 | 18 | const mitWorkerId = env.doMitWorker.idFromName('default') 19 | return await env.doMitWorker 20 | .get(mitWorkerId, { locationHint: 'enam' }) 21 | .fetch(`https://fake-host/group/event/${group}`, req.raw) 22 | .then(res => new Response(res.body, res)) 23 | }) 24 | .get('/:id/status/v1', async ({ env, req, json }) => { 25 | const id = req.param('id') 26 | 27 | const mitWorkerId = env.doMitWorker.idFromName('default') 28 | const mitWorkerResult = await ofetch(`https://fake-host/status/${id}`, { 29 | fetcher: env.doMitWorker.get(mitWorkerId, { locationHint: 'enam' }), 30 | }) 31 | 32 | if (mitWorkerResult.type !== 'not_found') 33 | return json(mitWorkerResult) 34 | 35 | const 
dbResult = await env.DB 36 | .prepare('SELECT state, translation_mask FROM task WHERE id = ?') 37 | .bind(id) 38 | .first<{ state: number; translation_mask: string } | null>() 39 | 40 | if (!dbResult) 41 | return json({ type: 'not_found' } satisfies QueryV1Message) 42 | 43 | if (dbResult.state === dbEnum.taskState.done) { 44 | return json({ 45 | type: 'result', 46 | result: { 47 | translation_mask: dbResult.translation_mask 48 | ? `${env.WKR2_PUBLIC_EXPOSED_BASE}/${dbResult.translation_mask}` 49 | : BLANK_PNG, 50 | }, 51 | } satisfies QueryV1Message) 52 | } 53 | else if (dbResult.state === dbEnum.taskState.error) { 54 | return json({ type: 'error' } satisfies QueryV1Message) 55 | } 56 | else { 57 | return json({ 58 | type: 'status', 59 | status: 'pending', 60 | } satisfies QueryV1Message) 61 | } 62 | }) 63 | .get('/:id/event/v1', async ({ env, req }) => { 64 | const id = req.param('id') 65 | 66 | if (req.header('Upgrade') !== 'websocket') 67 | throw new Error('Not a websocket request') 68 | 69 | const mitWorkerId = env.doMitWorker.idFromName('default') 70 | const mitWorkerResult = await env.doMitWorker 71 | .get(mitWorkerId, { locationHint: 'enam' }) 72 | .fetch(`https://fake-host/event/${id}`, req.raw) 73 | 74 | if (mitWorkerResult.status === 101) 75 | return new Response(mitWorkerResult.body, mitWorkerResult) 76 | 77 | const status = await mitWorkerResult.json() 78 | if (status.type === 'not_found') { 79 | const dbResult = await env.DB 80 | .prepare('SELECT state, translation_mask FROM task WHERE id = ?') 81 | .bind(id) 82 | .first<{ state: number; translation_mask: string | null } | null>() 83 | 84 | const sendAndClose = (data: QueryV1Message) => { 85 | const pair = new WebSocketPair() 86 | // @ts-expect-error Cloudflare only 87 | pair[1].accept() 88 | pair[1].send(JSON.stringify(data)) 89 | pair[1].close() 90 | return new Response(null, { status: 101, webSocket: pair[0] }) 91 | } 92 | 93 | if (!dbResult) 94 | return sendAndClose({ type: 'not_found' }) 95 | 96 | 
if (dbResult.state === dbEnum.taskState.done) { 97 | return sendAndClose({ 98 | type: 'result', 99 | result: { 100 | translation_mask: dbResult.translation_mask 101 | ? `${env.WKR2_PUBLIC_EXPOSED_BASE}/${dbResult.translation_mask}` 102 | : BLANK_PNG, 103 | }, 104 | }) 105 | } 106 | else if (dbResult.state === dbEnum.taskState.error) { 107 | return sendAndClose({ type: 'error' }) 108 | } 109 | else { 110 | return sendAndClose({ 111 | type: 'status', 112 | status: 'pending', 113 | }) 114 | } 115 | } 116 | else { 117 | throw new Error('Unexpected response') 118 | } 119 | }) 120 | -------------------------------------------------------------------------------- /wk-gateway/src/types.ts: -------------------------------------------------------------------------------- 1 | // FIXME Type '{ Bindings: Bindings; }' does not satisfy the constraint 'Env'. 2 | // Types of property 'Bindings' are incompatible. 3 | // eslint-disable-next-line @typescript-eslint/consistent-type-definitions 4 | export type Bindings = { 5 | // TODO use mTLS 6 | MIT_WORKERS_SECRET: string 7 | 8 | JWT_PRIVATE_KEY: string 9 | JWT_PUBLIC_KEY: string 10 | 11 | WKR2_PRIVATE_BASE: string 12 | WKR2_PUBLIC_BASE: string 13 | WKR2_PUBLIC_EXPOSED_BASE: string 14 | 15 | DB: D1Database 16 | doMitWorker: DurableObjectNamespace 17 | doImage: DurableObjectNamespace 18 | wkr2_private: Fetcher 19 | wkr2_public: Fetcher 20 | } 21 | -------------------------------------------------------------------------------- /wk-gateway/src/utils/index.ts: -------------------------------------------------------------------------------- 1 | export * from './memo' 2 | export * from './png' 3 | -------------------------------------------------------------------------------- /wk-gateway/src/utils/memo.ts: -------------------------------------------------------------------------------- 1 | export function memo(fn: () => NonNullable): () => NonNullable { 2 | let cache: T 3 | return () => cache ??= fn() 4 | } 5 | 
-------------------------------------------------------------------------------- /wk-gateway/src/utils/png.ts: -------------------------------------------------------------------------------- 1 | export const BLANK_PNG = 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAQAAAC1HAwCAAAAC0lEQVQI12NgYAAAAAMAASDVlMcAAAAASUVORK5CYII=' 2 | -------------------------------------------------------------------------------- /wk-gateway/tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "compilerOptions": { 3 | "baseUrl": ".", 4 | "module": "ESNext", 5 | "target": "ESNext", 6 | "lib": ["ESNext", "DOM", "DOM.Iterable"], 7 | "types": ["@cloudflare/workers-types"], 8 | "strict": true, 9 | "esModuleInterop": true, 10 | "skipLibCheck": true, 11 | "moduleResolution": "node", 12 | "jsx": "preserve", 13 | "resolveJsonModule": true, 14 | "strictNullChecks": true, 15 | "forceConsistentCasingInFileNames": true, 16 | "paths": { 17 | "@/*": ["*"] 18 | } 19 | }, 20 | "include": ["**/*.ts"], 21 | "exclude": ["dist", "node_modules"] 22 | } 23 | -------------------------------------------------------------------------------- /wk-gateway/wrangler.domitworker.toml: -------------------------------------------------------------------------------- 1 | name = 'cotrans-wk-gateway-domitworker' 2 | main = 'dist/doMitWorker.mjs' 3 | compatibility_date = '2023-07-09' 4 | compatibility_flags = [] 5 | workers_dev = false 6 | usage_model = 'bundled' 7 | 8 | [[migrations]] 9 | tag = "v1" 10 | new_classes = ["DOMitWorker"] 11 | 12 | [durable_objects] 13 | bindings = [{ name = "doMitWorker", class_name = "DOMitWorker" }] 14 | 15 | [[d1_databases]] 16 | binding = "DB" 17 | database_name = "cotrans" 18 | database_id = "5586b253-f5be-44cc-9ae4-284029d78da0" 19 | migrations_dir = "../migrations" 20 | -------------------------------------------------------------------------------- /wk-gateway/wrangler.toml: 
-------------------------------------------------------------------------------- 1 | name = 'cotrans-wk-gateway' 2 | main = 'dist/index.mjs' 3 | compatibility_date = '2023-07-09' 4 | compatibility_flags = [] 5 | workers_dev = false 6 | usage_model = 'bundled' 7 | services = [ 8 | { binding = "wkr2_private", service = "cotrans-wkr2-private" }, 9 | { binding = "wkr2_public", service = "cotrans-wkr2-public" }, 10 | ] 11 | 12 | [durable_objects] 13 | bindings = [ 14 | { name = "doMitWorker", class_name = "DOMitWorker", script_name = "cotrans-wk-gateway-domitworker" }, 15 | { name = "doImage", class_name = "DOImage", script_name = "cotrans-wk-image" }, 16 | ] 17 | 18 | [[d1_databases]] 19 | binding = "DB" 20 | database_name = "cotrans" 21 | database_id = "5586b253-f5be-44cc-9ae4-284029d78da0" 22 | migrations_dir = "../migrations" 23 | 24 | [placement] 25 | mode = "smart" 26 | -------------------------------------------------------------------------------- /wk-image/.gitignore: -------------------------------------------------------------------------------- 1 | /build/ 2 | -------------------------------------------------------------------------------- /wk-image/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "cotrans-wk-image" 3 | version = "0.1.0" 4 | edition.workspace = true 5 | rust-version.workspace = true 6 | publish = false 7 | 8 | [lib] 9 | crate-type = ["cdylib"] 10 | 11 | [dependencies] 12 | once_cell = "1.18.0" 13 | hex = "0.4.3" 14 | serde = { version = "1.0.174", features = ["derive"] } 15 | serde_json = "1.0.103" 16 | console_error_panic_hook = "0.1.7" 17 | web-sys = { version = "=0.3.61", features = ["File", "Crypto", "SubtleCrypto"] } 18 | worker-sys = "0.0.9" 19 | worker = "0.0.17" 20 | 21 | image = "0.24.6" 22 | fast_image_resize = "2.7.3" 23 | image_hasher = { version = "1.2.0", path = "../img_hash", features = [ 24 | "nightly", 25 | ] } 26 | 27 | 
[package.metadata.wasm-pack.profile.release] 28 | wasm-opt = false 29 | -------------------------------------------------------------------------------- /wk-image/package.json: -------------------------------------------------------------------------------- 1 | { 2 | "private": true 3 | } 4 | -------------------------------------------------------------------------------- /wk-image/src/lib.rs: -------------------------------------------------------------------------------- 1 | use std::{io::Cursor, num::NonZeroU32}; 2 | 3 | use console_error_panic_hook::set_once as set_panic_hook; 4 | use fast_image_resize as fr; 5 | use image::{ 6 | codecs::png::{CompressionType, PngEncoder}, 7 | io::Reader as ImageReader, 8 | DynamicImage, ImageEncoder, ImageFormat, 9 | }; 10 | use image_hasher::{Hasher, HasherConfig}; 11 | use js_sys::{ArrayBuffer, Uint8Array}; 12 | use once_cell::sync::Lazy; 13 | use serde::Serialize; 14 | use wasm_bindgen::prelude::*; 15 | use wasm_bindgen_futures::JsFuture; 16 | use worker::*; 17 | use worker_sys::R2Bucket; 18 | 19 | static HASHER: Lazy = Lazy::new(|| { 20 | HasherConfig::new() 21 | .hash_size(10, 10) 22 | .resize_filter(image_hasher::FilterType::Lanczos3) 23 | .preproc_dct() 24 | .to_hasher() 25 | }); 26 | 27 | pub fn hash_image(image: &DynamicImage) -> String { 28 | let hash = HASHER.hash_image(image); 29 | hex::encode(hash.as_bytes()) 30 | } 31 | 32 | #[durable_object] 33 | pub struct DOImage { 34 | env: Env, 35 | } 36 | 37 | #[durable_object] 38 | impl DurableObject for DOImage { 39 | fn new(state: State, env: Env) -> Self { 40 | Self { env } 41 | } 42 | 43 | async fn fetch(&mut self, req: Request) -> Result { 44 | handle(req, &self.env).await 45 | } 46 | } 47 | 48 | #[derive(Serialize)] 49 | struct ResponseJson { 50 | key: String, 51 | width: u32, 52 | height: u32, 53 | size: usize, 54 | hash: String, 55 | sha: String, 56 | } 57 | 58 | async fn handle(mut req: Request, env: &Env) -> Result { 59 | set_panic_hook(); 60 | let worker: 
web_sys::WorkerGlobalScope = js_sys::global().unchecked_into(); 61 | let bucket_pri: R2Bucket = js_sys::Reflect::get(env, &JsValue::from("BUCKET_PRI")) 62 | .unwrap() 63 | .unchecked_into(); 64 | 65 | let form = req.form_data().await?; 66 | 67 | let Some(FormEntry::File(file)) = form.get("file") else { 68 | return Response::error("No file found", 400); 69 | }; 70 | let file = file.bytes().await?; 71 | 72 | let mime = match form.get("mime") { 73 | Some(FormEntry::Field(mime)) => Some(mime), 74 | _ => None, 75 | }; 76 | 77 | drop(form); 78 | 79 | let cursor = Cursor::new(file); 80 | let mut image = match mime { 81 | Some(mime) if !mime.is_empty() => { 82 | let Some(format) = ImageFormat::from_mime_type(mime) else { 83 | return Response::error("Invalid MIME type", 400); 84 | }; 85 | let Ok(image) = ImageReader::with_format(cursor, format).decode() else { 86 | return Response::error("Invalid image", 400); 87 | }; 88 | image 89 | } 90 | _ => { 91 | let Ok(reader) = ImageReader::new(cursor).with_guessed_format() else { 92 | return Response::error("Could not guess image format", 400); 93 | }; 94 | let Ok(image) = reader.decode() else { 95 | return Response::error("Invalid image", 400); 96 | }; 97 | image 98 | } 99 | }; 100 | 101 | let mut width = image.width(); 102 | let mut height = image.height(); 103 | 104 | image = match image { 105 | DynamicImage::ImageRgb8(_) => image, 106 | DynamicImage::ImageRgba8(_) => image, 107 | DynamicImage::ImageLuma8(_) => image, 108 | DynamicImage::ImageLumaA8(_) => image, 109 | _ => DynamicImage::ImageRgba8(image.to_rgba8()), 110 | }; 111 | 112 | // scale image to less than 6000x6000 113 | if width > 6000 || height > 6000 { 114 | let widthf: f64 = width as f64; 115 | let heightf: f64 = height as f64; 116 | 117 | let (nwidth, nheight) = if widthf > heightf { 118 | (6000, (6000. / widthf * heightf).round() as u32) 119 | } else { 120 | ((6000. 
/ heightf * widthf).round() as u32, 6000) 121 | }; 122 | 123 | image = resize(image, nwidth, nheight); 124 | 125 | width = nwidth; 126 | height = nheight; 127 | } 128 | 129 | // sha using SubtleCrypto 130 | let sha: ArrayBuffer = JsFuture::from( 131 | worker 132 | .crypto()? 133 | .subtle() 134 | .digest_with_str_and_buffer_source( 135 | "SHA-256", 136 | &unsafe { Uint8Array::view(image.as_bytes()) }.into(), 137 | )?, 138 | ) 139 | .await? 140 | .unchecked_into(); 141 | let sha = hex::encode(Uint8Array::new(&sha).to_vec()); 142 | 143 | let mut png_buf: Vec = vec![]; 144 | if let Err(_) = PngEncoder::new_with_quality( 145 | &mut Cursor::new(&mut png_buf), 146 | CompressionType::Fast, 147 | image::codecs::png::FilterType::default(), 148 | ) 149 | .write_image(image.as_bytes(), width, height, image.color()) 150 | { 151 | return Response::error("Could not encode image", 500); 152 | }; 153 | 154 | let size = png_buf.len(); 155 | 156 | let key = "upload/".to_owned() + &sha + ".png"; 157 | let put_res = JsFuture::from(bucket_pri.put( 158 | key.clone(), 159 | unsafe { Uint8Array::view(&png_buf).into() }, 160 | JsValue::UNDEFINED, 161 | )); 162 | 163 | // hash the image while we wait for the upload to finish 164 | let hash = hash_image(&image); 165 | let _ = put_res.await?; 166 | 167 | Response::from_json(&ResponseJson { 168 | key, 169 | width, 170 | height, 171 | size, 172 | hash, 173 | sha, 174 | }) 175 | } 176 | 177 | fn resize(image: DynamicImage, width: u32, height: u32) -> DynamicImage { 178 | let pixel_type = match image { 179 | DynamicImage::ImageRgb8(_) => fr::PixelType::U8x3, 180 | DynamicImage::ImageRgba8(_) => fr::PixelType::U8x4, 181 | DynamicImage::ImageLuma8(_) => fr::PixelType::U8, 182 | DynamicImage::ImageLumaA8(_) => fr::PixelType::U8x2, 183 | _ => unreachable!(), 184 | }; 185 | 186 | let mut src_img = fr::Image::from_vec_u8( 187 | NonZeroU32::new(image.width()).unwrap(), 188 | NonZeroU32::new(image.height()).unwrap(), 189 | image.into_bytes(), 190 | 
pixel_type, 191 | ) 192 | .unwrap(); 193 | 194 | // multiple RGB channels of source image by alpha channel 195 | // (not required for the Nearest algorithm) 196 | let alpha_mul_div = fr::MulDiv::default(); 197 | if pixel_type == fr::PixelType::U8x4 || pixel_type == fr::PixelType::U8x2 { 198 | alpha_mul_div 199 | .multiply_alpha_inplace(&mut src_img.view_mut()) 200 | .unwrap(); 201 | } 202 | 203 | let mut dst_img = fr::Image::new( 204 | NonZeroU32::new(width).unwrap(), 205 | NonZeroU32::new(height).unwrap(), 206 | src_img.pixel_type(), 207 | ); 208 | 209 | let mut dst_view = dst_img.view_mut(); 210 | 211 | let mut resizer = fr::Resizer::new(fr::ResizeAlg::Convolution(fr::FilterType::Lanczos3)); 212 | resizer.resize(&src_img.view(), &mut dst_view).unwrap(); 213 | 214 | if pixel_type == fr::PixelType::U8x4 || pixel_type == fr::PixelType::U8x2 { 215 | alpha_mul_div.divide_alpha_inplace(&mut dst_view).unwrap(); 216 | } 217 | 218 | match pixel_type { 219 | fr::PixelType::U8x3 => DynamicImage::ImageRgb8( 220 | image::RgbImage::from_vec( 221 | dst_img.width().get(), 222 | dst_img.height().get(), 223 | dst_img.into_vec(), 224 | ) 225 | .unwrap(), 226 | ), 227 | fr::PixelType::U8x4 => DynamicImage::ImageRgba8( 228 | image::RgbaImage::from_vec( 229 | dst_img.width().get(), 230 | dst_img.height().get(), 231 | dst_img.into_vec(), 232 | ) 233 | .unwrap(), 234 | ), 235 | fr::PixelType::U8 => DynamicImage::ImageLuma8( 236 | image::GrayImage::from_vec( 237 | dst_img.width().get(), 238 | dst_img.height().get(), 239 | dst_img.into_vec(), 240 | ) 241 | .unwrap(), 242 | ), 243 | fr::PixelType::U8x2 => DynamicImage::ImageLumaA8( 244 | image::GrayAlphaImage::from_vec( 245 | dst_img.width().get(), 246 | dst_img.height().get(), 247 | dst_img.into_vec(), 248 | ) 249 | .unwrap(), 250 | ), 251 | _ => unreachable!(), 252 | } 253 | } 254 | -------------------------------------------------------------------------------- /wk-image/wrangler.toml: 
-------------------------------------------------------------------------------- 1 | name = "cotrans-wk-image" 2 | main = "build/worker/shim.mjs" 3 | compatibility_date = '2023-07-09' 4 | compatibility_flags = [] 5 | usage_model = 'unbound' 6 | workers_dev = false 7 | 8 | [[migrations]] 9 | tag = "v1" 10 | new_classes = ["DOImage"] 11 | 12 | [durable_objects] 13 | bindings = [{ name = "doImage", class_name = "DOImage" }] 14 | 15 | [[r2_buckets]] 16 | binding = 'BUCKET_PRI' 17 | bucket_name = 'cotrans-private' 18 | 19 | [build] 20 | command = "cargo install -q worker-build && RUSTFLAGS=\"-Ctarget-feature=+simd128\" worker-build --release . -Zbuild-std=std,panic_abort" 21 | -------------------------------------------------------------------------------- /wkr2/.gitignore: -------------------------------------------------------------------------------- 1 | /dist/ 2 | -------------------------------------------------------------------------------- /wkr2/.prettierrc: -------------------------------------------------------------------------------- 1 | { 2 | "semi": true, 3 | "printWidth": 100, 4 | "singleQuote": true, 5 | "bracketSpacing": true, 6 | "insertPragma": false, 7 | "requirePragma": false, 8 | "jsxSingleQuote": false, 9 | "bracketSameLine": false, 10 | "embeddedLanguageFormatting": "auto", 11 | "htmlWhitespaceSensitivity": "css", 12 | "vueIndentScriptAndStyle": true, 13 | "quoteProps": "consistent", 14 | "proseWrap": "preserve", 15 | "trailingComma": "es5", 16 | "arrowParens": "avoid", 17 | "useTabs": true, 18 | "tabWidth": 2 19 | } 20 | -------------------------------------------------------------------------------- /wkr2/README.md: -------------------------------------------------------------------------------- 1 | # Template: worker-r2 2 | 3 | [![Deploy to Cloudflare Workers](https://deploy.workers.cloudflare.com/button)](https://deploy.workers.cloudflare.com/?url=https://github.com/cloudflare/templates/tree/main/worker-r2) 4 | 5 | A template for interfacing 
with an R2 bucket from within a Cloudflare Worker. 6 | 7 | Please refer to the [Use R2 from Workers](https://developers.cloudflare.com/r2/data-access/workers-api/workers-api-usage/) documentation when using this template. 8 | 9 | ## Setup 10 | 11 | To create a `my-project` directory using this template, run: 12 | 13 | ```sh 14 | $ npm init cloudflare my-project worker-r2 15 | # or 16 | $ yarn create cloudflare my-project worker-r2 17 | # or 18 | $ pnpm create cloudflare my-project worker-r2 19 | ``` 20 | 21 | > **Note:** Each command invokes [`create-cloudflare`](https://www.npmjs.com/package/create-cloudflare) for project creation. 22 | 23 | ## Getting started 24 | 25 | Run the following commands in the console: 26 | 27 | ```sh 28 | # Next, make sure you've logged in 29 | npx wrangler login 30 | 31 | # Create your R2 bucket 32 | npx wrangler r2 bucket create 33 | 34 | # Add config to wrangler.toml as instructed 35 | 36 | # Deploy the worker 37 | npx wrangler deploy 38 | ``` 39 | 40 | Then test out your new Worker! 41 | 42 | ## Note about access and privacy 43 | 44 | With the default code in this template, every incoming request has the ability to interact with your R2 bucket. This means your bucket is publicly exposed and its contents can be accessed and modified by undesired actors. 45 | 46 | You must define authorization logic to determine who can perform what actions to your bucket. 
To know more about this take a look at the [Bucket access and privacy](https://developers.cloudflare.com/r2/data-access/workers-api/workers-api-usage/#6-bucket-access-and-privacy) section of the **Use R2 from Workers** documentation 47 | -------------------------------------------------------------------------------- /wkr2/package.json: -------------------------------------------------------------------------------- 1 | { 2 | "private": true, 3 | "dependencies": { 4 | "jose": "^4.14.4", 5 | "zod": "^3.21.4" 6 | }, 7 | "devDependencies": { 8 | "@cloudflare/workers-types": "^4.20230717.1" 9 | } 10 | } 11 | -------------------------------------------------------------------------------- /wkr2/src/index.ts: -------------------------------------------------------------------------------- 1 | import { importSPKI, jwtVerify } from 'jose' 2 | import { z } from 'zod' 3 | 4 | export interface Env { 5 | JWT_PUBLIC_KEY: string 6 | JWT_AUDIENCE: string 7 | BUCKET: R2Bucket 8 | } 9 | 10 | const JWTSchema = z.object({ 11 | // files 12 | f: z.array(z.string()).optional(), 13 | // directories 14 | d: z.array(z.string().endsWith('/')).optional(), 15 | // permissions 16 | p: z.array(z.enum(['GET', 'PUT', 'DELETE'])), 17 | }) 18 | 19 | export default { 20 | async fetch(request: Request, env: Env): Promise<Response> { 21 | const jwt_public_key = await importSPKI(env.JWT_PUBLIC_KEY, 'ES256') 22 | 23 | const url = new URL(request.url) 24 | const file = url.pathname.slice(1) 25 | const token = url.searchParams.get('t') 26 | 27 | if (token === null) 28 | return new Response(JSON.stringify({ code: 'missing_token' }), { status: 400 }) 29 | 30 | // parse token 31 | let jwt: z.infer<typeof JWTSchema> 32 | try { 33 | const verified = await jwtVerify(token, jwt_public_key, { 34 | algorithms: ['ES256'], 35 | // issuer: 'wk:gateway:mit', 36 | audience: env.JWT_AUDIENCE, 37 | maxTokenAge: '4h', 38 | }) 39 | jwt = JWTSchema.parse(verified.payload) 40 | if (!jwt.f?.length && !jwt.d?.length) 41 | throw new Error('Missing file or
 directory') 42 | } 43 | catch (error) { 44 | console.error(String(error instanceof Error ? error.stack : error)) 45 | return new Response(JSON.stringify({ code: 'invalid_token' }), { status: 400 }) 46 | } 47 | 48 | // check permissions 49 | if (!jwt.p.includes(request.method as never)) 50 | return new Response(JSON.stringify({ code: 'forbidden' }), { status: 403 }) 51 | 52 | // check if file is in scope: deny unless the key is explicitly listed in `f` or falls under a directory prefix in `d`. (The previous `(f-miss) && (d-miss)` form denied only when BOTH lists were present and failed, so a token carrying just one list granted access to every key.) 53 | if ( 54 | !jwt.f?.includes(file) 55 | && !jwt.d?.some(d => file.startsWith(d)) 56 | ) 57 | return new Response(JSON.stringify({ code: 'forbidden' }), { status: 403 }) 58 | 59 | // handle request 60 | switch (request.method) { 61 | case 'PUT': { 62 | const obj = await env.BUCKET.put(file, request.body) 63 | return new Response(JSON.stringify({ code: 'ok', file, size: obj.size })) 64 | } 65 | 66 | case 'GET': { 67 | const obj = await env.BUCKET.get(file) 68 | 69 | if (obj === null) 70 | return new Response(JSON.stringify({ code: 'not_found' }), { status: 404 }) 71 | 72 | const headers = new Headers() 73 | obj.writeHttpMetadata(headers) 74 | headers.set('etag', obj.httpEtag) 75 | 76 | return new Response(obj.body, { headers }) 77 | } 78 | 79 | case 'DELETE': { 80 | await env.BUCKET.delete(file) 81 | return new Response(JSON.stringify({ code: 'ok', file })) 82 | } 83 | 84 | default: 85 | return new Response(JSON.stringify({ code: 'method_not_allowed' }), { status: 405 }) 86 | } 87 | }, 88 | } 89 | -------------------------------------------------------------------------------- /wkr2/tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "compilerOptions": { 3 | "baseUrl": ".", 4 | "module": "ESNext", 5 | "target": "ESNext", 6 | "lib": ["ESNext", "DOM", "DOM.Iterable"], 7 | "types": ["@cloudflare/workers-types"], 8 | "strict": true, 9 | "esModuleInterop": true, 10 | "skipLibCheck": true, 11 | "moduleResolution": "node", 12 | "jsx": "preserve", 13 | "resolveJsonModule": true, 14 | 
"strictNullChecks": true, 15 | "forceConsistentCasingInFileNames": true, 16 | "paths": { 17 | "@/*": ["*"] 18 | } 19 | }, 20 | "include": ["**/*.ts"], 21 | "exclude": ["dist", "node_modules"] 22 | } 23 | -------------------------------------------------------------------------------- /wkr2/wrangler.toml: -------------------------------------------------------------------------------- 1 | name = "cotrans-wkr2-public" 2 | main = "src/index.ts" 3 | compatibility_date = '2023-07-09' 4 | compatibility_flags = [] 5 | workers_dev = false 6 | usage_model = 'bundled' 7 | 8 | [[r2_buckets]] 9 | binding = 'BUCKET' 10 | bucket_name = 'cotrans-public' 11 | 12 | [placement] 13 | mode = "smart" 14 | 15 | [env.private] 16 | name = "cotrans-wkr2-private" 17 | 18 | [[env.private.r2_buckets]] 19 | binding = 'BUCKET' 20 | bucket_name = 'cotrans-private' 21 | --------------------------------------------------------------------------------