$ curl {url.toString()}
Segmentation fault (core dumped)

$ # Looks like you wound up accessing a memory region — errr, page — that doesn't exist.
$ # Want to learn more about page faults? Start from the beginning!
├── vercel.json
├── tsconfig.json
├── public
│   ├── stats
│   │   └── js
│   │       └── script.js
│   ├── banner.png
│   ├── robots.txt
│   ├── favicon-on-dark.png
│   ├── images
│   │   ├── the-end.png
│   │   ├── cpu-pleading-face.png
│   │   ├── elf-data-section.png
│   │   ├── elf-file-structure.png
│   │   ├── init-process-tree.png
│   │   ├── binprm-buf-changelog.png
│   │   ├── fetch-execute-cycle.png
│   │   ├── instruction-pointer.png
│   │   ├── writing-this-article.png
│   │   ├── gnu-linux-elf-drawing.jpg
│   │   ├── hardware-interrupt-meme.png
│   │   ├── interrupt-vector-table.png
│   │   ├── elf-program-header-types.png
│   │   ├── kernel-mode-vs-user-mode.png
│   │   ├── linux-shebang-truncation.png
│   │   ├── static-vs-dynamic-linking.png
│   │   ├── keyboard-hardware-interrupt.png
│   │   ├── multilevel-paging-explainer.png
│   │   ├── page-table-entry-permissions.png
│   │   ├── virtual-memory-mmu-example.png
│   │   ├── 4kib-paging-address-breakdown.png
│   │   ├── higher-half-kernel-memory-map.png
│   │   ├── linux-scheduler-target-latency.png
│   │   ├── process-virtual-memory-mapping.png
│   │   ├── elf-section-header-table-diagram.png
│   │   ├── linux-program-execution-process.png
│   │   ├── syscall-architecture-differences.png
│   │   ├── assembly-to-machine-code-translation.png
│   │   └── demand-paging-with-page-faults-comic.png
│   ├── favicon-on-light.png
│   ├── editions
│   │   └── printable.pdf
│   ├── github-images
│   │   ├── banner-dark.png
│   │   └── banner-light.png
│   ├── orpheus-flag.svg
│   └── squiggles
│       └── bottom.svg
├── postcss.config.cjs
├── src
│   ├── env.d.ts
│   ├── metadata.ts
│   ├── content
│   │   ├── config.ts
│   │   └── chapters
│   │       ├── 0-intro.mdx
│   │       ├── 7-epilogue.mdx
│   │       ├── 2-slice-dat-time.mdx
│   │       ├── 4-becoming-an-elf-lord.mdx
│   │       ├── 1-the-basics.mdx
│   │       ├── 6-lets-talk-about-forks-and-cows.mdx
│   │       ├── 5-the-translator-in-your-computer.mdx
│   │       └── 3-how-to-run-a-program.mdx
│   ├── components
│   │   ├── EditButton.astro
│   │   ├── DowngradeHeadings.astro
│   │   ├── TOCList.astro
│   │   ├── ScrollPadding.astro
│   │   ├── OldNav.astro
│   │   ├── ColoredTitle.astro
│   │   ├── CodeBlock.astro
│   │   ├── ExternalNav.astro
│   │   └── SEO.astro
│   ├── styles
│   │   ├── 404.css
│   │   ├── home.css
│   │   ├── chapter.css
│   │   ├── one-pager.css
│   │   └── global.css
│   └── pages
│       ├── 404.astro
│       ├── editions
│       │   └── one-pager.astro
│       ├── index.astro
│       └── [...slug].astro
├── .gitignore
├── package.json
├── astro.config.mjs
├── LICENSE
├── .github
│   └── workflows
│       └── deploy.yml
├── README.md
└── scripts
    ├── pdfgen.js
    └── run-pdf-ci.mjs
/vercel.json:
--------------------------------------------------------------------------------
1 | {
2 | "trailingSlash": false
3 | }
4 |
--------------------------------------------------------------------------------
/tsconfig.json:
--------------------------------------------------------------------------------
1 | {
2 | "extends": "astro/tsconfigs/base"
3 | }
4 |
--------------------------------------------------------------------------------
/public/stats/js/script.js:
--------------------------------------------------------------------------------
1 | // This is a Vercel rewrite in production, see vercel.json.
--------------------------------------------------------------------------------
/postcss.config.cjs:
--------------------------------------------------------------------------------
1 | module.exports = {
2 | plugins: [ require('postcss-nesting') ]
3 | }
--------------------------------------------------------------------------------
/public/banner.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Revisto/putting-the-you-in-cpu/main/public/banner.png
--------------------------------------------------------------------------------
/public/robots.txt:
--------------------------------------------------------------------------------
1 | User-agent: *
2 | Allow: /
3 |
4 | Sitemap: https://cpu.land/sitemap-index.xml
5 |
--------------------------------------------------------------------------------
/src/env.d.ts:
--------------------------------------------------------------------------------
1 | /// <reference types="astro/client" />
--------------------------------------------------------------------------------
/src/content/chapters/0-intro.mdx:
--------------------------------------------------------------------------------
12 |
13 | I cracked and started reading as much as I could. If you aren't going to college, there aren't many comprehensive resources for understanding how systems work, so I had to sift through a wide range of sources that sometimes even contradicted each other. After a few weeks of research and almost 40 pages of notes, I think I have a much better understanding of how computers work, from power-on to running programs. I seriously would've killed for one article that taught me everything I learned along the way, so I'm writing the article I wish someone had written for me.
14 |
15 | And you know what they say... you've only truly understood something when you can explain it to someone else.
16 |
17 | > In a hurry? Feel like you already know this stuff?
18 | >
19 | > Read chapter 3, and I promise you'll learn something new, unless you're someone like Linus Torvalds!
20 |
--------------------------------------------------------------------------------
/.github/workflows/deploy.yml:
--------------------------------------------------------------------------------
1 | name: Deploy to GitHub Pages
2 |
3 | on:
4 | push:
5 | branches:
6 | - main
7 | workflow_dispatch:
8 |
9 | concurrency:
10 | group: "pages"
11 | cancel-in-progress: false
12 |
13 | jobs:
14 | build:
15 | runs-on: ubuntu-latest
16 | permissions:
17 | contents: write
18 | steps:
19 | - name: Checkout repository
20 | uses: actions/checkout@v4
21 |
22 | - name: Set up Node.js
23 | uses: actions/setup-node@v4
24 | with:
25 | node-version: '18'
26 | cache: 'npm'
27 |
28 | - name: Install dependencies
29 | run: npm install
30 |
31 | - name: Build project
32 | run: npm run build
33 |
34 | - name: Generate PDF
35 | run: npm run generate-pdf:ci
36 |
37 | - name: Copy PDF to dist directory
38 | run: cp public/editions/printable.pdf dist/editions/printable.pdf
39 |
40 | - name: Commit and push PDF
41 | run: |
42 | git config --global user.name 'github-actions[bot]'
43 | git config --global user.email 'github-actions[bot]@users.noreply.github.com'
44 | git add public/editions/printable.pdf
45 | # Check if there are changes to commit
46 | if ! git diff --staged --quiet; then
47 | git commit -m "docs: update printable.pdf [skip ci]"
48 | git push
49 | else
50 | echo "No changes to printable.pdf to commit."
51 | fi
52 |
53 | - name: Upload artifact
54 | uses: actions/upload-pages-artifact@v3
55 | with:
56 | path: ./dist
57 |
58 | deploy:
59 | needs: build
60 | runs-on: ubuntu-latest
61 | permissions:
62 | pages: write
63 | id-token: write
64 | environment:
65 | name: github-pages
66 | url: ${{ steps.deployment.outputs.page_url }}
67 | steps:
68 | - name: Deploy to GitHub Pages
69 | id: deployment
70 | uses: actions/deploy-pages@v4
71 |
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 |
4 | A technical explainer of how your computer runs programs, from start to finish.
8 |
9 |
16 |
17 | I cracked and started figuring as much out as possible. There aren't many comprehensive systems resources if you aren't going to college, so I had to sift through tons of different sources of varying quality and sometimes conflicting information. A couple weeks of research and almost 40 pages of notes later, I think I have a much better idea of how computers work from startup to program execution. I would've killed for one solid article explaining what I learned, so I'm writing the article that I wished I had.
18 |
19 | And you know what they say... you only truly understand something if you can explain it to someone else.
20 |
21 | > In a hurry? Feel like you know this stuff already?
22 | >
23 | > [Read chapter 3](https://cpu.land/how-to-run-a-program) and I guarantee you will learn something new. Unless you're like, Linus Torvalds himself.
24 |
25 | Continue to Chapter 1: The "Basics" »
(cpu.land)
Curious what exactly happens when you run a program on your computer? Read this article to learn how multiprocessing works, what system calls really are, how computers manage memory with hardware interrupts, and how Linux loads executables.
51 |
52 | Written by
53 | Lexi Mattick
54 | &
55 | Hack Club
56 | ·
57 | January 2023
58 |
59 |
--------------------------------------------------------------------------------
/src/content/chapters/7-epilogue.mdx:
--------------------------------------------------------------------------------
16 |
17 | ... but wait, there's more!
18 |
19 | ## Bonus: Translating C Concepts
20 |
21 | If you've done some low-level programming yourself, you probably know what the stack and the heap are and you've probably used `malloc`. You might not have thought a lot about how they're implemented!
22 |
23 | First of all, a thread's stack is a fixed amount of memory that's mapped to somewhere high up in virtual memory. On most (although [not all](https://stackoverflow.com/a/664779)) architectures, the stack pointer starts at the top of the stack memory and moves downward as it increments. Physical memory is not allocated up-front for the entire mapped stack space; instead, demand paging is used to lazily allocate memory as frames of the stack are reached.
24 |
25 | It might be surprising to hear that heap allocation functions like `malloc` are not system calls. Instead, heap memory management is provided by the libc implementation! `malloc`, `free`, et al. are complex procedures, and the libc keeps track of memory mapping details itself. Under the hood, the userland heap allocator uses syscalls including `mmap` (which can map more than just files) and `sbrk`.
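As a quick illustration of that split, here's a tiny experiment you can run on Linux. It's a sketch; the exact behavior is libc-specific (glibc, for instance, serves sufficiently large allocations with `mmap` instead of growing the heap), and running it under `strace` makes the underlying syscalls visible:

```c
// Sketch: peek at what's underneath malloc. With glibc, small allocations
// usually grow the heap via brk/sbrk, while large ones get their own mmap mapping.
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>

int main(void) {
    void *break_before = sbrk(0);              // current top of the heap (the "program break")
    void *small = malloc(64);                  // likely satisfied by moving the break
    void *large = malloc(16 * 1024 * 1024);    // likely satisfied by a fresh mmap mapping
    void *break_after = sbrk(0);

    printf("program break moved by %ld bytes\n",
           (long)((char *)break_after - (char *)break_before));
    printf("small allocation at %p, large allocation at %p\n", small, large);

    free(large);
    free(small);
    return 0;
}
```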
26 |
27 | ## Bonus: Tidbits
28 |
29 | I couldn't find anywhere coherent to put these, but found them amusing, so here you go.
30 |
31 | > *Most Linux users probably have a sufficiently interesting life that they spend little time imagining how page tables are represented in the kernel.*
32 | >
33 | > *[Jonathan Corbet, LWN](https://lwn.net/Articles/106177/)*
34 |
35 | An alternate visualization of hardware interrupts:
36 |
37 |
38 |
39 | A note that some system calls use a technique called vDSOs instead of jumping into kernel space. I didn't have time to talk about this, but it's quite interesting and I recommend [reading](https://en.wikipedia.org/wiki/VDSO) [into](https://man7.org/linux/man-pages/man7/vdso.7.html) [it](https://0xax.gitbooks.io/linux-insides/content/SysCall/linux-syscall-3.html).
40 |
41 | And finally, addressing the Unix allegations: I do feel bad that a lot of the execution-specific stuff is very Unix-specific. If you're a macOS or Linux user this is fine, but it won't bring you too much closer to how Windows executes programs or handles system calls, although the CPU architecture stuff is all the same. In the future I would love to write an article that covers the Windows world.
42 |
43 | ## Acknowledgements
44 |
45 | I talked to GPT-3.5 and GPT-4 a decent amount while writing this article. While they lied to me a lot and most of the information was useless, they were sometimes very helpful for working through problems. LLM assistance can be net positive if you're aware of their limitations and are extremely skeptical of everything they say. That said, they're terrible at writing. Don't let them write for you.
46 |
47 | More importantly, thank you to all the humans who proofread me, encouraged me, and helped me brainstorm — especially Ani, B, Ben, Caleb, Kara, polypixeldev, Pradyun, Spencer, Nicky (who drew the wonderful elf in [chapter 4](/becoming-an-elf-lord)), and my lovely parents.
48 |
49 | If you are a teenager and you like computers and you are not already in the [Hack Club Slack](https://hackclub.com/slack), you should join right now. I would not have written this article if I didn't have a community of awesome people to share my thoughts and progress with. If you are not a teenager, you should [give us money](https://hackclub.com/philanthropy/) so we can keep doing cool things.
50 |
51 | All of the mediocre art in this article was drawn in [Figma](https://figma.com/). I used [Obsidian](https://obsidian.md/) for editing, and sometimes [Vale](https://vale.sh/) for linting. The Markdown source for this article is [available on GitHub](https://github.com/hackclub/putting-the-you-in-cpu/) and open to future nitpicks, and all art is published on a [Figma community page](https://www.figma.com/community/file/1260699047973407903).
52 |
53 |
54 |
--------------------------------------------------------------------------------
/src/pages/[...slug].astro:
--------------------------------------------------------------------------------
1 | ---
2 | import '../styles/global.css'
3 | import '../styles/chapter.css'
4 |
5 | import { CollectionEntry, getCollection, getEntryBySlug } from 'astro:content'
6 | import TOCList from '../components/TOCList.astro'
7 | import SEO from '../components/SEO.astro'
8 | import ExternalNav from '../components/ExternalNav.astro'
9 | import ColoredTitle from '../components/ColoredTitle.astro'
10 | import EditButton from '../components/EditButton.astro'
11 | import ScrollPadding from '../components/ScrollPadding.astro'
12 | import OldNav from '../components/OldNav.astro'
13 |
14 | const baseUrl = import.meta.env.BASE_URL && import.meta.env.BASE_URL !== '/' ? `${import.meta.env.BASE_URL}/` : '/'
15 |
16 | export interface Params {
17 | slug: CollectionEntry<'chapters'>['slug']
18 | }
19 |
20 | const chapter = await getEntryBySlug('chapters', Astro.params.slug)
21 | const { Content, headings } = await chapter.render()
22 |
23 | const allChapters = await getCollection('chapters')
24 | const prevChapter = allChapters
25 | .find(otherChapter => otherChapter.data.chapter === chapter.data.chapter - 1)
26 | const nextChapter = allChapters
27 | .find(otherChapter => otherChapter.data.chapter === chapter.data.chapter + 1)
28 |
29 | export async function getStaticPaths() {
30 | const chapters = await getCollection('chapters')
31 | return chapters
32 | .filter(chapter => chapter.data.chapter !== 0) // Skip the intro
33 | .map(chapter => ({ params: { slug: chapter.slug } }))
34 | }
35 | ---
36 |
37 |
38 |
39 |
40 |
41 |
--------------------------------------------------------------------------------
/src/content/chapters/2-slice-dat-time.mdx:
--------------------------------------------------------------------------------
20 |
21 | OS schedulers use *timer chips* like [PITs](https://en.wikipedia.org/wiki/Programmable_interval_timer) to trigger hardware interrupts for multitasking:
22 |
23 | 1. Before jumping to program code, the OS sets the timer chip to trigger an interrupt after some period of time.
24 | 2. The OS switches to user mode and jumps to the next instruction of the program.
25 | 3. When the timer elapses, it triggers a hardware interrupt to switch to kernel mode and jump to OS code.
26 | 4. The OS can now save where the program left off, load a different program, and repeat the process.
27 |
28 | This is called *preemptive multitasking*; the interruption of a process is called [*preemption*](https://en.wikipedia.org/wiki/Preemption_(computing)). If you’re, say, reading this article on a browser and listening to music on the same machine, your very own computer is probably following this exact cycle thousands of times a second.
29 |
30 | ## Timeslice Calculation
31 |
32 | A *timeslice* is the duration an OS scheduler allows a process to run before preempting it. The simplest way to pick timeslices is to give every process the same timeslice, perhaps in the 10 ms range, and cycle through tasks in order. This is called *fixed timeslice round-robin* scheduling.
33 |
34 | > **Aside: fun jargon facts!**
35 | >
36 | > Did you know that timeslices are often called "quantums?" Now you do, and you can impress all your tech friends. I think I deserve heaps of praise for not saying quantum in every other sentence in this article.
37 | >
38 | > Speaking of timeslice jargon, Linux kernel devs use the [jiffy](https://github.com/torvalds/linux/blob/22b8cc3e78f5448b4c5df00303817a9137cd663f/include/linux/jiffies.h) time unit to count fixed frequency timer ticks. Among other things, jiffies are used for measuring the lengths of timeslices. Linux's jiffy frequency is typically 1000 Hz but can be configured when compiling the kernel.
39 |
40 | A slight improvement to fixed timeslice scheduling is to pick a *target latency* — the ideal longest time for a process to respond. The target latency is the time it takes for a process to resume execution after being preempted, assuming a reasonable number of processes. *This is pretty hard to visualize! Don't worry, a diagram is coming soon.*
41 |
42 | Timeslices are calculated by dividing the target latency by the total number of tasks; this is better than fixed timeslice scheduling because it eliminates wasteful task switching with fewer processes. With a target latency of 15 ms and 10 processes, each process would get 15/10 or 1.5 ms to run. With only 3 processes, each process gets a longer 5 ms timeslice while still hitting the target latency.
43 |
44 | Process switching is computationally expensive because it requires saving the entire state of the current program and restoring a different one. Past a certain point, too small a timeslice can result in performance problems with processes switching too rapidly. It's common to give the timeslice duration a lower bound (*minimum granularity*). This does mean that the target latency is exceeded when there are enough processes for the minimum granularity to take effect.
45 |
46 | At the time of writing this article, Linux's scheduler uses a target latency of 6 ms and a minimum granularity of 0.75 ms.
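To make the arithmetic concrete, here's a toy version of that calculation using those two numbers. This is my own sketch, not the kernel's actual code:

```c
// Toy timeslice math: divide the target latency among runnable tasks, but never
// hand out less than the minimum granularity. (Illustrative only; CFS is far
// more sophisticated than this.)
#include <stdio.h>

double timeslice_ms(double target_latency_ms, double min_granularity_ms, int runnable_tasks) {
    double slice = target_latency_ms / runnable_tasks;
    return slice < min_granularity_ms ? min_granularity_ms : slice;
}

int main(void) {
    // Linux's values at the time of writing: 6 ms target latency, 0.75 ms minimum granularity.
    for (int n = 1; n <= 16; n *= 2)
        printf("%2d runnable tasks -> %.2f ms each\n", n, timeslice_ms(6.0, 0.75, n));
    // Past 8 tasks the minimum granularity wins, and the 6 ms target latency is exceeded.
    return 0;
}
```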
47 |
48 |
49 |
50 | Round-robin scheduling with this basic timeslice calculation is close to what most computers do nowadays. It's still a bit naive; most operating systems tend to have more complex schedulers which take process priorities and deadlines into account. Since 2007, Linux has used a scheduler called [Completely Fair Scheduler](https://docs.kernel.org/scheduler/sched-design-CFS.html). CFS does a bunch of very fancy computer science things to prioritize tasks and divvy up CPU time.
51 |
52 | Every time the OS preempts a process it needs to load the new program's saved execution context, including its memory environment. This is accomplished by telling the CPU to use a different *page table*, the mapping from "virtual" to physical addresses. This is also the system that prevents programs from accessing each other's memory; we'll go down this rabbit hole in chapters [5](/the-translator-in-your-computer) and [6](/lets-talk-about-forks-and-cows) of this article.
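Here's a very rough model of what happens on each of those preemptions. Everything in it (the struct fields, the function, the whole shape) is made up for illustration and looks nothing like the real kernel code:

```c
// A toy model of preemption. Real kernels save full register state and swap
// page tables in architecture-specific assembly; this just shows the idea.
#include <stdio.h>

typedef struct {
    const char *name;
    long saved_instruction_pointer;   // where this task gets resumed next time
    long page_table_address;          // which virtual memory mapping to hand to the MMU
} task;

void context_switch(task *current, task *next, long interrupted_at) {
    current->saved_instruction_pointer = interrupted_at;  // remember where we preempted it
    printf("switching page table to %#lx, resuming %s at %#lx\n",
           next->page_table_address, next->name, next->saved_instruction_pointer);
    // ...then the kernel would reload next's registers and drop back to user mode.
}

int main(void) {
    task music   = { "music player", 0x401000, 0x1000 };
    task browser = { "browser",      0x7ff123, 0x2000 };
    context_switch(&music, &browser, 0x401234);   // timer tick: browser's turn
    context_switch(&browser, &music, 0x7ff456);   // next tick: back to the music player
    return 0;
}
```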
53 |
54 | ## Note #1: Kernel Preemptability
55 |
56 | So far, we've been only talking about the preemption and scheduling of userland processes. Kernel code might make programs feel laggy if it took too long handling a syscall or executing driver code.
57 |
58 | Modern kernels, including Linux, are [preemptive kernels](https://en.wikipedia.org/wiki/Kernel_preemption). This means they're programmed in a way that allows kernel code itself to be interrupted and scheduled just like userland processes.
59 |
60 | This isn't very important to know about unless you're writing a kernel or something, but basically every article I've read has mentioned it so I thought I would too! Extra knowledge is rarely a bad thing.
61 |
62 | ## Note #2: A History Lesson
63 |
64 | Ancient operating systems, including classic Mac OS and versions of Windows long before NT, used a predecessor to preemptive multitasking. Rather than the OS deciding when to preempt programs, the programs themselves would choose to yield to the OS. They would trigger a software interrupt to say, "hey, you can let another program run now." These explicit yields were the only way for the OS to regain control and switch to the next scheduled process.
65 |
66 | This is called [*cooperative multitasking*](https://en.wikipedia.org/wiki/Cooperative_multitasking). It has a couple major flaws: malicious or just poorly designed programs can easily freeze the entire operating system, and it's nigh impossible to ensure temporal consistency for realtime/time-sensitive tasks. For these reasons, the tech world switched to preemptive multitasking a long time ago and never looked back.
67 |
--------------------------------------------------------------------------------
/src/content/chapters/4-becoming-an-elf-lord.mdx:
--------------------------------------------------------------------------------
1 | ---
2 | chapter: 4
3 | title: Becoming an Elf-Lord
4 | shortname: ELF
5 | slug: becoming-an-elf-lord
6 | updatedAt: 2023-07-17T17:16:18.079Z
7 | ---
8 |
9 | import CodeBlock from '../../components/CodeBlock.astro'
10 |
11 | We pretty thoroughly understand `execve` now. At the end of most paths, the kernel will reach a final program containing machine code for it to launch. Typically, a setup process is required before actually jumping to the code — for example, different parts of the program have to be loaded into the right places in memory. Each program needs different amounts of memory for different things, so we have standard file formats that specify how to set up a program for execution. While Linux supports many such formats, the most common format by far is *ELF* (executable and linkable format).
12 |
13 |
14 |
15 |
18 | (Thank you to Nicky Case for the adorable drawing.)
19 |
20 |
47 |
48 | ### ELF Header
49 |
50 | Every ELF file has an [ELF header](https://refspecs.linuxfoundation.org/elf/gabi4+/ch4.eheader.html). It has the very important job of conveying basic information about the binary such as:
51 |
52 | - What processor it's designed to run on. ELF files can contain machine code for different processor types, like ARM and x86.
53 | - Whether the binary is meant to be run on its own as an executable, or whether it's meant to be loaded by other programs as a "dynamically linked library." We'll go into details about what dynamic linking is soon.
54 | - The entry point of the executable. Later sections specify exactly where to load data contained in the ELF file into memory. The entry point is a memory address pointing to where the first machine code instruction is in memory after the entire process has been loaded.
55 |
56 | The ELF header is always at the start of the file. It specifies the locations of the program header table and section header table, which can be anywhere within the file. Those tables, in turn, point to data stored elsewhere in the file.
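For reference, this is what that header looks like in C. It's the 64-bit layout from glibc's `<elf.h>`, with the ELF typedefs written out as fixed-width integers and comments added:

```c
#include <stdint.h>

typedef struct {
    unsigned char e_ident[16];  // magic bytes ("\x7fELF"), 32/64-bit, endianness, ...
    uint16_t      e_type;       // executable, shared object, relocatable, core dump
    uint16_t      e_machine;    // target architecture (x86-64, ARM, RISC-V, ...)
    uint32_t      e_version;
    uint64_t      e_entry;      // entry point: virtual address of the first instruction
    uint64_t      e_phoff;      // file offset of the program header table
    uint64_t      e_shoff;      // file offset of the section header table
    uint32_t      e_flags;
    uint16_t      e_ehsize;     // size of this header
    uint16_t      e_phentsize;  // size of each program header entry...
    uint16_t      e_phnum;      // ...and how many there are
    uint16_t      e_shentsize;  // same for section header entries
    uint16_t      e_shnum;
    uint16_t      e_shstrndx;   // which section holds section names (.shstrtab)
} Elf64_Ehdr;
```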
57 |
58 | ### Program Header Table
59 |
60 | The [program header table](https://refspecs.linuxbase.org/elf/gabi4+/ch5.pheader.html) is a series of entries containing specific details for how to load and execute the binary at runtime. Each entry has a type field that says what detail it's specifying — for example, `PT_LOAD` means it contains data that should be loaded into memory, but `PT_NOTE` means the segment contains informational text that shouldn't necessarily be loaded anywhere.
61 |
62 |
63 |
64 | Each entry specifies information about where its data is in the file and, sometimes, how to load the data into memory:
65 |
66 | - It points to the position of its data within the ELF file.
67 | - It can specify what virtual memory address the data should be loaded into memory at. This is typically left blank if the segment isn't meant to be loaded into memory.
68 | - Two fields specify the length of the data: one for the length of the data in the file, and one for the length of the memory region to be created. If the memory region length is longer than the length in the file, the extra memory will be filled with zeroes. This is beneficial for programs that might want a static segment of memory to use at runtime; these empty segments of memory are typically called [BSS](https://en.wikipedia.org/wiki/.bss) segments.
69 | - Finally, a flags field specifies what operations should be permitted if it's loaded into memory: `PF_R` makes it readable, `PF_W` makes it writable, and `PF_X` means it's code that should be allowed to execute on the CPU.
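Put together, each program header entry is a small fixed-size record. This is the 64-bit layout from `<elf.h>`, again with the typedefs expanded and comments added:

```c
#include <stdint.h>

typedef struct {
    uint32_t p_type;    // PT_LOAD, PT_NOTE, PT_INTERP, ...
    uint32_t p_flags;   // permissions: PF_R | PF_W | PF_X
    uint64_t p_offset;  // where the segment's data starts within the ELF file
    uint64_t p_vaddr;   // virtual address to map it at
    uint64_t p_paddr;   // physical address (unused on most modern systems)
    uint64_t p_filesz;  // how many bytes of data are in the file
    uint64_t p_memsz;   // how big the memory region should be (extra space is zero-filled)
    uint64_t p_align;   // required alignment, typically the page size
} Elf64_Phdr;
```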
70 |
71 | ### Section Header Table
72 |
73 | The [section header table](https://refspecs.linuxbase.org/elf/gabi4+/ch4.sheader.html) is a series of entries containing information about *sections*. This section information is like a map, charting the data inside the ELF file. It makes it easy for [programs like debuggers](https://www.sourceware.org/gdb/) to understand the intended uses of different portions of the data.
74 |
75 |
76 |
77 | For example, the program header table can specify a large swath of data to be loaded into memory together. That single `PT_LOAD` block might contain both code and global variables! There's no reason those have to be specified separately to *run* the program; the CPU just starts at the entry point and steps forward, accessing data when and where the program requests it. However, software like a debugger for *analyzing* the program needs to know exactly where each area starts and ends, otherwise it might try to decode some text that says "hello" as code (and since that isn't valid code, explode). This information is stored in the section header table.
78 |
79 | While it's usually included, the section header table is actually optional. ELF files can run perfectly well with the section header table completely removed, and developers who want to hide what their code does will sometimes intentionally strip or mangle the section header table from their ELF binaries to [make them harder to decode](https://binaryresearch.github.io/2019/09/17/Analyzing-ELF-Binaries-with-Malformed-Headers-Part-1-Emulating-Tiny-Programs.html).
80 |
81 | Each section has a name, a type, and some flags that specify how it's intended to be used and decoded. Standard names usually start with a dot by convention. The most common sections are:
82 |
83 | - `.text`: machine code to be loaded into memory and executed on the CPU. `SHT_PROGBITS` type with the `SHF_EXECINSTR` flag to mark it as executable, and the `SHF_ALLOC` flag which means it's loaded into memory for execution. (Don't get confused by the name, it's still just binary machine code! I always found it somewhat strange that it's called `.text` despite not being readable "text.")
84 | - `.data`: initialized data hardcoded in the executable to be loaded into memory. For example, a global variable containing some text might be in this section. If you write low-level code, this is the section where statics go. This also has the type `SHT_PROGBITS`, which just means the section contains "information for the program." Its flags are `SHF_ALLOC` and `SHF_WRITE` to mark it as writable memory.
85 | - `.bss`: I mentioned earlier that it's common to have some allocated memory that starts out zeroed. It would be a waste to include a bunch of empty bytes in the ELF file, so a special segment type called BSS is used. It's helpful to know about BSS segments during debugging, so there's also a section header table entry that specifies the length of the memory to be allocated. It's of type `SHT_NOBITS`, and is flagged `SHF_ALLOC` and `SHF_WRITE`.
86 | - `.rodata`: this is like `.data` except it's read-only. In a very basic C program that runs `printf("Hello, world!")`, the string "Hello world!" would be in a `.rodata` section, while the actual printing code would be in a `.text` section.
87 | - `.shstrtab`: this is a fun implementation detail! The names of sections themselves (like `.text` and `.shstrtab`) aren't included directly in the section header table. Instead, each entry contains an offset to a location in the ELF file that contains its name. This way, each entry in the section header table can be the same size, making them easier to parse — an offset to the name is a fixed-size number, whereas including the name in the table would use a variable-size string. All of this name data is stored in its own section called `.shstrtab`, of type `SHT_STRTAB`.
88 |
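As a rough guide to where things land (compilers have some latitude here, so treat this as a sketch rather than a guarantee), here's a tiny C file annotated with the section each piece typically ends up in. Running `readelf -S` or `objdump -h` on the compiled object will show the real layout:

```c
int counter = 5;                 // .data: initialized global
int scratch[4096];               // .bss: zero-initialized, takes no space in the file
const char *greeting = "hello";  // the string bytes land in .rodata
                                 // (the pointer itself is initialized data)

int add(int a, int b) {          // .text: machine code
    static int calls;            // .bss: statics behave like globals here
    calls++;
    return a + b;
}
```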
89 | ### Data
90 |
91 | The program and section header table entries all point to blocks of data within the ELF file, whether to load them into memory, to specify where program code is, or just to name sections. All of these different pieces of data are contained in the data section of the ELF file.
92 |
93 |
94 |
95 | ## A Brief Explanation of Linking
96 |
97 | Back to the `binfmt_elf` code: the kernel cares about two types of entries in the program header table.
98 |
99 | `PT_LOAD` segments specify where all the program data, like the `.text` and `.data` sections, need to be loaded into memory. The kernel reads these entries from the ELF file to load the data into memory so the program can be executed by the CPU.
100 |
101 | The other type of program header table entry that the kernel cares about is `PT_INTERP`, which specifies a "dynamic linking runtime."
102 |
103 | Before we talk about what dynamic linking is, let's talk about "linking" in general. Programmers tend to build their programs on top of libraries of reusable code — for example, libc, which we talked about earlier. When turning your source code into an executable binary, a program called a linker resolves all these references by finding the library code and copying it into the binary. This process is called *static linking*, which means external code is included directly in the file that's distributed.
104 |
105 | However, some libraries are super common. You'll find libc is used by basically every program under the sun, since it's the canonical interface for interacting with the OS through syscalls. It would be a terrible use of space to include a separate copy of libc in every single program on your computer. Also, it might be nice if bugs in libraries could be fixed in one place rather than having to wait for each program that uses the library to be updated. Dynamic linking is the solution to these problems.
106 |
107 | If a statically linked program needs a function `foo` from a library called `bar`, the program would include a copy of the entirety of `foo`. However, if it's dynamically linked it would only include a reference saying "I need `foo` from library `bar`." When the program is run, `bar` is hopefully installed on the computer and the `foo` function's machine code can be loaded into memory on-demand. If the computer's installation of the `bar` library is updated, the new code will be loaded the next time the program runs without needing any change in the program itself.
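You can even do this lookup by hand at runtime. Here's a sketch using the real `dlopen`/`dlsym` API (the `libbar.so` and `foo` names are made up for the example); this is essentially what the dynamic linker automates for normal dynamically linked programs:

```c
// Compile with: cc demo.c -ldl
#include <stdio.h>
#include <dlfcn.h>

int main(void) {
    void *bar = dlopen("libbar.so", RTLD_NOW);          // find and map the library
    if (!bar) { fprintf(stderr, "%s\n", dlerror()); return 1; }

    int (*foo)(int) = (int (*)(int))dlsym(bar, "foo");  // look up the symbol by name
    if (foo) printf("foo(2) = %d\n", foo(2));

    dlclose(bar);
    return 0;
}
```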
108 |
109 |
110 |
111 | ## Dynamic Linking in the Wild
112 |
113 | On Linux, dynamically linkable libraries like `bar` are typically packaged into files with the .so (Shared Object) extension. These .so files are ELF files just like programs — you may recall that the ELF header includes a field to specify whether the file is an executable or a library. In addition, shared objects have a `.dynsym` section in the section header table which contains information on what symbols are exported from the file and can be dynamically linked to.
114 |
115 | On Windows, libraries like `bar` are packaged into .dll (**d**ynamic **l**ink **l**ibrary) files. macOS uses the .dylib (**dy**namically linked **lib**rary) extension. Just like macOS apps and Windows .exe files, these are formatted slightly differently from ELF files but are the same concept and technique.
116 |
117 | An interesting distinction between the two types of linking is that with static linking, only the portions of the library that are used are included in the executable and thus loaded into memory. With dynamic linking, the *entire library* is loaded into memory. This might initially sound less efficient, but it actually allows modern operating systems to save *more* space by loading a library into memory once and then sharing that code between processes. Only code can be shared as the library needs different state for different programs, but the savings can still be on the order of tens to hundreds of megabytes of RAM.
118 |
119 | ## Execution
120 |
121 | Let's hop on back to the kernel running ELF files: if the binary it's executing is dynamically linked, the OS can't just jump to the binary's code right away because there would be missing code — remember, dynamically linked programs only have references to the library functions they need!
122 |
123 | To run the binary, the OS needs to figure out what libraries are needed, load them, replace all the named pointers with actual jump instructions, and *then* start the actual program code. This is very complex code that interacts deeply with the ELF format, so it's usually a standalone program rather than part of the kernel. ELF files specify the path to the program they want to use (typically something like `/lib64/ld-linux-x86-64.so.2`) in a `PT_INTERP` entry in the program header table.
124 |
125 | After reading the ELF header and scanning through the program header table, the kernel can set up the memory structure for the new program. It starts by loading all `PT_LOAD` segments into memory, populating the program's static data, BSS space, and machine code. If the program is dynamically linked, the kernel will have to execute the [ELF interpreter](https://unix.stackexchange.com/questions/400621/what-is-lib64-ld-linux-x86-64-so-2-and-why-can-it-be-used-to-execute-file) (`PT_INTERP`), so it also loads the interpreter's data, BSS, and code into memory.
126 |
127 | Now the kernel needs to set the instruction pointer for the CPU to restore when returning to userland. If the executable is dynamically linked, the kernel sets the instruction pointer to the start of the ELF interpreter's code in memory. Otherwise, the kernel sets it to the start of the executable.
128 |
129 | The kernel is almost ready to return from the syscall (remember, we're still in `execve`). It pushes the `argc`, `argv`, and environment variables to the stack for the program to read when it begins.
130 |
131 | The registers are now cleared. Before handling a syscall, the kernel stores the current value of registers to the stack to be restored when switching back to user space. Before returning to user space, the kernel zeroes this part of the stack.
132 |
133 | Finally, the syscall is over and the kernel returns to userland. It restores the registers, which are now zeroed, and jumps to the stored instruction pointer. That instruction pointer is now the starting point of the new program (or the ELF interpreter) and the current process has been replaced!
134 |
--------------------------------------------------------------------------------
/src/content/chapters/1-the-basics.mdx:
--------------------------------------------------------------------------------
1 | ---
2 | chapter: 1
3 | title: The Basics
4 | shortname: Basics
5 | slug: the-basics
6 | updatedAt: 2023-07-19T18:57:54.630Z
7 | ---
8 |
9 | One thing that surprised me over and over while writing this was just how simple computers are. It's still hard for me not to get in my own head and expect more complexity and abstraction than there really is. If there's one thing you should burn into your brain before continuing, it's that everything that looks simple really is that simple. That simplicity is beautiful, and sometimes very, very annoying.
10 |
11 | Let's start with the most fundamental part of how a computer works, at its very core.
12 |
13 | ## How Are Computers Designed?
14 |
15 | The *central processing unit* (CPU) in a computer is in charge of all computation. It's the big boss, the grand wizard. It starts working the moment you turn your computer on, executing instruction after instruction, one by one.
16 |
17 | The first mass-produced CPU was the Intel 4004, designed in the late '60s by the Italian physicist and engineer Federico Faggin. Unlike the 64-bit systems we use today, it had a 4-bit architecture and was far less complex than modern processors, but a lot of that early design simplicity still shows up in today's CPUs.
18 |
19 | The "instructions" that CPUs execute are just binary data: a byte or two to specify which instruction to run (the opcode), followed by whatever data is needed to execute that instruction. What we call machine code is just a series of these binary instructions in a row. Assembly is a helper language that makes machine code easier for humans to read and write than raw bits; when you write assembly, it always ends up assembled into the same binary code the CPU knows how to read.
20 |
21 |
22 |
23 | > Note: instructions aren't always mapped one-to-one to machine code as in the example above. For example, the assembly instruction `add eax, 512` translates to `05 00 02 00 00`.
24 | >
25 | > The first byte (`05`) is an opcode that specifically means adding a 32-bit number to the EAX register. The remaining bytes are 512 (`0x200`) stored little-endian.
26 | >
27 | > Defuse Security has made a handy tool for converting between assembly and machine code that you can play around with.
28 |
29 | RAM is your computer's main memory bank, a large multi-purpose space which stores all the data used by programs running on your computer. That includes the program code itself as well as the code at the core of the operating system. The CPU always reads machine code directly from RAM, and code can't be run if it isn't loaded into RAM.
30 |
31 | The CPU stores an *instruction pointer* which points to the location in RAM where it's going to fetch the next instruction. After executing each instruction, the CPU moves the pointer and repeats. This is the *fetch-execute cycle*.
32 |
33 |
34 |
35 | After executing an instruction, the pointer moves forward to immediately after the instruction in RAM so that it now points to the next instruction. That's why code runs! The instruction pointer just keeps chugging forward, executing machine code in the order in which it has been stored in memory. Some instructions can tell the instruction pointer to jump somewhere else instead, or jump different places depending on a certain condition; this makes reusable code and conditional logic possible.
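To make the cycle concrete, here's a toy fetch-execute loop for an imaginary two-values-per-instruction machine. This is purely illustrative; real CPUs do this in hardware, not in C:

```c
#include <stdio.h>

enum { OP_HALT, OP_LOAD, OP_ADD, OP_JUMP };

int main(void) {
    // "RAM": an opcode followed by one operand, over and over.
    int ram[] = { OP_LOAD, 7, OP_ADD, 5, OP_HALT, 0 };
    int ip  = 0;   // instruction pointer: where the next instruction lives
    int acc = 0;   // a single register

    for (;;) {
        int opcode  = ram[ip];     // fetch
        int operand = ram[ip + 1];
        ip += 2;                   // move the pointer forward...
        switch (opcode) {          // ...and execute
            case OP_LOAD: acc = operand; break;
            case OP_ADD:  acc += operand; break;
            case OP_JUMP: ip = operand; break;  // a jump just overwrites the pointer
            case OP_HALT: printf("acc = %d\n", acc); return 0;
        }
    }
}
```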
36 |
37 | This instruction pointer is stored in a [*register*](https://en.wikipedia.org/wiki/Processor_register). Registers are small storage buckets that are extremely fast for the CPU to read and write to. Each CPU architecture has a fixed set of registers, used for everything from storing temporary values during computations to configuring the processor.
38 |
39 | Some registers are directly accessible from machine code, like `ebx` in the earlier diagram.
40 |
41 | Other registers are only used internally by the CPU, but can often be updated or read using specialized instructions. One example is the instruction pointer, which can't be read directly but can be updated with, for example, a jump instruction.
42 |
43 | ## Processors Are Naive
44 |
45 | Let's go back to the original question: what happens when you run an executable program on your computer? First, a bunch of magic happens to get ready to run it — we’ll work through all of this later — but at the end of the process there’s machine code in a file somewhere. The operating system loads this into RAM and instructs the CPU to jump the instruction pointer to that position in RAM. The CPU continues running its fetch-execute cycle as usual, so the program begins executing!
46 |
47 | (This was one of those psyching-myself-out moments for me — seriously, this is how the program you are using to read this article is running! Your CPU is fetching your browser's instructions from RAM in sequence and directly executing them, and they're rendering this article.)
48 |
49 |
50 |
51 | It turns out CPUs have a super basic worldview; they only see the current instruction pointer and a bit of internal state. Processes are entirely operating system abstractions, not something CPUs natively understand or keep track of.
52 |
53 | *\*waves hands\* processes are abstractions made up by ~~os devs~~ big byte to sell more computers*
54 |
55 | For me, this raises more questions than it answers:
56 |
57 | 1. If the CPU doesn’t know about multiprocessing and just executes instructions sequentially, why doesn’t it get stuck inside whatever program it’s running? How can multiple programs run at once?
58 | 2. If programs run directly on the CPU, and the CPU can directly access RAM, why can't code access memory from other processes, or, god forbid, the kernel?
59 | 3. Speaking of which, what's the mechanism that prevents every process from running any instruction and doing anything to your computer? AND WHAT'S A DAMN SYSCALL?
60 |
61 | The question about memory deserves its own section and is covered in [chapter 5](/the-translator-in-your-computer) — the TL;DR is that most memory accesses actually go through a layer of misdirection that remaps the entire address space. For now, we're going to pretend that programs can access all RAM directly and computers can only run one process at once. We'll explain away both of these assumptions in time.
62 |
63 | It's time to leap through our first rabbit hole into a land filled with syscalls and security rings.
64 |
65 | > **Aside: what is a kernel, btw?**
66 | >
67 | > Your computer's operating system, like macOS, Windows, or Linux, is the collection of software that runs on your computer and makes all the basic stuff work. "Basic stuff" is a really general term, and so is "operating system" — depending on who you ask, it can include such things as the apps, fonts, and icons that come with your computer by default.
68 | >
69 | > The kernel, however, is the core of the operating system. When you boot up your computer, the instruction pointer starts at a program somewhere. That program is the kernel. The kernel has near-full access to your computer's memory, peripherals, and other resources, and is in charge of running software installed on your computer (known as userland programs). We'll learn about how the kernel has this access — and how userland programs don't — over the course of this article.
70 | >
71 | > Linux is just a kernel and needs plenty of userland software like shells and display servers to be usable. The kernel in macOS is called [XNU](https://en.wikipedia.org/wiki/XNU) and is Unix-like, and the modern Windows kernel is called the [NT Kernel](https://en.wikipedia.org/wiki/Architecture_of_Windows_NT).
72 |
73 | ## Two Rings to Rule Them All
74 |
75 | The *mode* (sometimes called privilege level or ring) a processor is in controls what it's allowed to do. Modern architectures have at least two options: kernel/supervisor mode and user mode. While an architecture might support more than two modes, only kernel mode and user mode are commonly used these days.
76 |
77 | In kernel mode, anything goes: the CPU is allowed to execute any supported instruction and access any memory. In user mode, only a subset of instructions is allowed, I/O and memory access is limited, and many CPU settings are locked. Generally, the kernel and drivers run in kernel mode while applications run in user mode.
78 |
79 | Processors start in kernel mode. Before executing a program, the kernel initiates the switch to user mode.
80 |
81 |
82 |
83 | An example of how processor modes manifest in a real architecture: on x86-64, the current privilege level (CPL) can be read from a register called `cs` (code segment). Specifically, the CPL is contained in the two [least significant bits](https://en.wikipedia.org/wiki/Bit_numbering) of the `cs` register. Those two bits can store x86-64's four possible rings: ring 0 is kernel mode and ring 3 is user mode. Rings 1 and 2 are designed for running drivers but are only used by a handful of older niche operating systems. If the CPL bits are `11`, for example, the CPU is running in ring 3: user mode.
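If you want to see this for yourself, here's a small check using x86-64 GCC/Clang inline assembly. A userland program should always print ring 3:

```c
#include <stdio.h>
#include <stdint.h>

int main(void) {
    uint16_t cs;
    __asm__ volatile ("mov %%cs, %0" : "=r"(cs));       // read the code segment register
    printf("current privilege level: ring %d\n", cs & 3); // the CPL is the two low bits
    return 0;
}
```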
84 |
85 | ## What Even is a Syscall?
86 |
87 | Programs run in user mode because they can't be trusted with full access to the computer. User mode does its job, preventing access to most of the computer — but programs need to be able to access I/O, allocate memory, and interact with the operating system *somehow*! To do so, software running in user mode has to ask the operating system kernel for help. The OS can then implement its own security protections to prevent programs from doing anything malicious.
88 |
89 | If you've ever written code that interacts with the OS, you'll probably recognize functions like `open`, `read`, `fork`, and `exit`. Below a couple of layers of abstraction, these functions all use *system calls* to ask the OS for help. A system call is a special procedure that lets a program start a transition from user space to kernel space, jumping from the program's code into OS code.
90 |
91 | User space to kernel space control transfers are accomplished using a processor feature called [*software interrupts*](https://en.wikipedia.org/wiki/Interrupt#Software_interrupts):
92 |
93 | 1. During the boot process, the operating system stores a table called an [*interrupt vector table*](https://en.wikipedia.org/wiki/Interrupt_vector_table) (IVT; x86-64 calls this the [interrupt descriptor table](https://en.wikipedia.org/wiki/Interrupt_descriptor_table)) in RAM and registers it with the CPU. The IVT maps interrupt numbers to handler code pointers.
94 |
95 |
96 |
97 | 2. Then, userland programs can use an instruction like [INT](https://www.felixcloutier.com/x86/intn:into:int3:int1) which tells the processor to look up the given interrupt number in the IVT, switch to kernel mode, and then jump the instruction pointer to the memory address stored in the IVT.
98 |
99 | When this kernel code finishes, it uses an instruction like [IRET](https://www.felixcloutier.com/x86/iret:iretd:iretq) to tell the CPU to switch back to user mode and return the instruction pointer to where it was when the interrupt was triggered.
100 |
101 | (If you were curious, the interrupt ID used for system calls on Linux is `0x80`. You can read a list of Linux system calls on [Michael Kerrisk's online manpage directory](https://man7.org/linux/man-pages/man2/syscalls.2.html).)
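Just for fun, here's what triggering that interrupt by hand looks like from C with inline assembly. This sketch uses the legacy 32-bit `int 0x80` convention, where the syscall number goes in `eax` and 20 is `getpid` in the 32-bit table; real programs should just go through libc:

```c
#include <stdio.h>

int main(void) {
    long pid;
    // eax = syscall number (20 = getpid in the 32-bit table); the result comes back in eax.
    // Works on typical x86 Linux builds; 64-bit kernels need 32-bit emulation enabled.
    __asm__ volatile ("int $0x80" : "=a"(pid) : "a"(20));
    printf("getpid() via int 0x80 returned %ld\n", pid);
    return 0;
}
```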
102 |
103 | ### Wrapper APIs: Abstracting Away Interrupts
104 |
105 | Here's what we know so far about system calls:
106 |
107 | - User mode programs can't access I/O or memory directly. They have to ask the OS for help interacting with the outside world.
108 | - Programs can delegate control to the OS with special machine code instructions like INT and IRET.
109 | - Programs can't directly switch privilege levels; software interrupts are safe because the processor has been preconfigured *by the OS* with where in the OS code to jump to. The interrupt vector table can only be configured from kernel mode.
110 |
111 | Programs need to pass data to the operating system when triggering a syscall; the OS needs to know which specific system call to execute alongside any data the syscall itself needs, for example, what filename to open. The mechanism for passing this data varies by operating system and architecture, but it's usually done by placing data in certain registers or on the stack before triggering the interrupt.
112 |
113 | The variance in how system calls are called across devices means it would be wildly impractical for programmers to implement system calls themselves for every program. This would also mean operating systems couldn't change their interrupt handling for fear of breaking every program that was written to use the old system. Finally, we typically don't write programs in raw assembly anymore — programmers can't be expected to drop down to assembly any time they want to read a file or allocate memory.
114 |
115 |
116 |
117 | So, operating systems provide an abstraction layer on top of these interrupts. Reusable higher-level library functions that wrap the necessary assembly instructions are provided by [libc](https://www.gnu.org/software/libc/) on Unix-like systems and part of a library called [ntdll.dll](https://learn.microsoft.com/en-us/windows-hardware/drivers/kernel/libraries-and-headers) on Windows. Calls to these library functions themselves don't cause switches to kernel mode, they're just standard function calls. Inside the libraries, assembly code does actually transfer control to the kernel, and is a lot more platform-dependent than the wrapping library subroutine.
118 |
119 | When you call `exit(1)` from C running on a Unix-like system, that function is internally running machine code to trigger an interrupt, after placing the system call's opcode and arguments in the right registers/stack/whatever. Computers are so cool!
120 |
121 | ## The Need for Speed / Let's Get CISC-y
122 |
123 | Many [CISC](https://en.wikipedia.org/wiki/Complex_instruction_set_computer) architectures like x86-64 contain instructions designed for system calls, created due to the prevalence of the system call paradigm.
124 |
125 | Intel and AMD managed not to coordinate very well on x86-64; it actually has *two* sets of optimized system call instructions. [SYSCALL](https://www.felixcloutier.com/x86/syscall.html) and [SYSENTER](https://www.felixcloutier.com/x86/sysenter) are optimized alternatives to instructions like `INT 0x80`. Their corresponding return instructions, [SYSRET](https://www.felixcloutier.com/x86/sysret.html) and [SYSEXIT](https://www.felixcloutier.com/x86/sysexit), are designed to transition quickly back to user space and resume program code.
126 |
127 | (AMD and Intel processors have slightly different compatibility with these instructions. `SYSCALL` is generally the best option for 64-bit programs, while `SYSENTER` has better support with 32-bit programs.)
128 |
129 | Representative of the style, [RISC](https://en.wikipedia.org/wiki/Reduced_instruction_set_computer) architectures tend not to have such special instructions. AArch64, the RISC architecture Apple Silicon is based on, uses only [one interrupt instruction](https://developer.arm.com/documentation/ddi0596/2021-12/Base-Instructions/SVC--Supervisor-Call-) for syscalls and software interrupts alike. I think Mac users are doing fine :)
130 |
131 | ---
132 |
133 | Whew, that was a lot! Let's do a brief recap:
134 |
135 | - Processors execute instructions in an infinite fetch-execute loop and don't have any concept of operating systems or programs. The processor's mode, usually stored in a register, determines what instructions may be executed. Operating system code runs in kernel mode and switches to user mode to run programs.
136 | - To run a binary, the operating system switches to user mode and points the processor to the code's entry point in RAM. Because they only have the privileges of user mode, programs that want to interact with the world need to jump to OS code for help. System calls are a standardized way for programs to switch from user mode to kernel mode and into OS code.
137 | - Programs typically use these syscalls by calling shared library functions. These wrap machine code for either software interrupts or architecture-specific syscall instructions that transfer control to the OS kernel and switch rings. The kernel does its business and switches back to user mode and returns to the program code.
138 |
139 | Let’s figure out how to answer my first question from earlier:
140 |
141 | > If the CPU doesn't keep track of more than one process and just executes instruction after instruction, why doesn't it get stuck inside whatever program it's running? How can multiple programs run at once?
142 |
143 | The answer to this, my dear friend, is also the answer to why Coldplay is so popular... clocks! (Well, technically timers. I just wanted to shoehorn that joke in.)
144 |
--------------------------------------------------------------------------------
/src/content/chapters/6-lets-talk-about-forks-and-cows.mdx:
--------------------------------------------------------------------------------
1 | ---
2 | chapter: 6
3 | title: Let's Talk About Forks and Cows
4 | shortname: Fork-Exec
5 | slug: lets-talk-about-forks-and-cows
6 | updatedAt: 2023-07-17T17:16:18.079Z
7 | ---
8 |
9 | import CodeBlock from '../../components/CodeBlock.astro'
10 |
11 | The final question: how did we get here? Where do the first processes come from?
12 |
13 | This article is almost done. We're on the final stretch. About to hit a home run. Moving on to greener pastures. And various other terrible idioms that mean you are a single *Length of Chapter 6* away from touching grass or whatever you do with your time when you aren't reading 15,000 word articles about CPU architecture.
14 |
15 | If `execve` starts a new program by replacing the current process, how do you start a new program separately, in a new process? This is a pretty important ability if you want to do multiple things on your computer; when you double-click an app to start it, the app opens separately while the program you were previously on continues running.
16 |
17 | The answer is another system call: `fork`, the system call fundamental to all multiprocessing. `fork` is quite simple, actually — it clones the current process and its memory, leaving the saved instruction pointer exactly where it is, and then allows both processes to proceed as usual. Without intervention, the programs continue to run independently from each other and all computation is doubled.
18 |
19 | The newly running process is referred to as the "child," with the process originally calling `fork` the "parent." Processes can call `fork` multiple times, thus having multiple children. Each child is numbered with a *process ID* (PID), starting with 1.
20 |
21 | Cluelessly doubling the same code is pretty useless, so `fork` returns a different value on the parent vs the child. On the parent, it returns the PID of the new child process, while on the child it returns 0. This makes it possible to do different work on the new process so that forking is actually helpful.
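In C, the standard pattern for acting on that return value looks like this (vanilla POSIX usage, not code from the article):

```c
#include <stdio.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/wait.h>

int main(void) {
    pid_t pid = fork();              // one process goes in, two come out

    if (pid == 0) {
        // fork() returned 0: this is the child
        printf("child:  my PID is %d\n", getpid());
    } else if (pid > 0) {
        // fork() returned the child's PID: this is still the parent
        printf("parent: spawned child %d\n", pid);
        wait(NULL);                  // reap the child so it doesn't linger as a zombie
    } else {
        perror("fork");              // fork can fail, e.g. if the process table is full
    }
    return 0;
}
```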
22 |
23 |
101 |
102 | Killing the init process kills all of its children and all of their children, shutting down your OS environment.
103 |
104 | ## Back to the Kernel
105 |
106 | We had a lot of fun looking at Linux kernel code [back in chapter 3](/how-to-run-a-program), so we're gonna do some more of that! This time we'll start with a look at how the kernel starts the init process.
107 |
108 | Your computer boots up in a sequence like the following:
109 |
110 | 1. The motherboard is bundled with a tiny piece of software that searches your connected disks for a program called a *bootloader*. It picks a bootloader, loads its machine code into RAM, and executes it.
111 |
112 | Keep in mind that we are not yet in the world of a running OS. Until the OS kernel starts an init process, multiprocessing and syscalls don’t really exist. In the pre-init context, "executing" a program means directly jumping to its machine code in RAM without expectation of return.
113 | 2. The bootloader is responsible for finding a kernel, loading it into RAM, and executing it. Some bootloaders, like [GRUB](https://www.gnu.org/software/grub/), are configurable and/or let you select between multiple operating systems. BootX and Windows Boot Manager are the built-in bootloaders of macOS and Windows, respectively.
114 | 3. The kernel is now running and begins a large routine of initialization tasks including setting up interrupt handlers, loading drivers, and creating the initial memory mapping. Finally, the kernel switches the privilege level to user mode and starts the init program.
115 | 4. We're finally in userland in an operating system! The init program begins running init scripts, starting services, and executing programs like the shell/UI.
116 |
117 | ### Initializing Linux
118 |
119 | On Linux, the bulk of step 3 (kernel initialization) occurs in the `start_kernel` function in [init/main.c](https://github.com/torvalds/linux/blob/22b8cc3e78f5448b4c5df00303817a9137cd663f/init/main.c). This function is over 200 lines of calls to various other init functions, so I won't include [the whole thing](https://github.com/torvalds/linux/blob/22b8cc3e78f5448b4c5df00303817a9137cd663f/init/main.c#L880-L1091) in this article, but I do recommend scanning through it! At the end of `start_kernel` a function named `arch_call_rest_init` is called:
120 |
121 |
--------------------------------------------------------------------------------
/src/content/chapters/5-the-translator-in-your-computer.mdx:
--------------------------------------------------------------------------------
24 |
25 | When the computer first boots up, memory accesses go directly to physical RAM. Immediately after startup, the OS creates the translation dictionary and tells the CPU to start using the MMU.
26 |
27 | This dictionary is actually called a *page table*, and this system of translating every memory access is called *paging*. Entries in the page table are called *pages* and each one represents how a certain chunk of virtual memory maps to RAM. These chunks are always a fixed size, and each processor architecture has a different page size. x86-64 has a default 4 KiB page size, meaning each page specifies the mapping for a block of memory 4,096 bytes long.
28 |
29 | In other words, with 4 KiB pages the bottom 12 bits of an address will always be the same before and after MMU translation — 12, because that's the amount of bits needed to index the 4,096-byte page you get post-translation.
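Here's that split as plain arithmetic (a worked sketch; the frame number is made up, and the page table lookup itself is just pretended here):

```c
#include <stdio.h>
#include <stdint.h>

int main(void) {
    uint64_t vaddr  = 0x4005D6;          // some virtual address
    uint64_t vpage  = vaddr >> 12;       // virtual page number: what the page table translates
    uint64_t offset = vaddr & 0xFFF;     // low 12 bits: position inside the 4,096-byte page

    uint64_t frame = 0x1234;             // pretend the page table maps vpage -> physical frame 0x1234
    uint64_t paddr = (frame << 12) | offset;  // the offset passes through untouched

    printf("virtual %#lx = page %#lx + offset %#lx -> physical %#lx\n",
           (unsigned long)vaddr, (unsigned long)vpage,
           (unsigned long)offset, (unsigned long)paddr);
    return 0;
}
```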
30 |
31 | x86-64 also allows operating systems to enable larger 2 MiB or 1 GiB pages, which can improve address translation speed but increase memory fragmentation and waste. The larger the page size, the smaller the portion of the address that's translated by the MMU.
32 |
33 |
34 |
35 | The page table itself just resides in RAM. While it can contain millions of entries, each entry is only a few bytes long (8 bytes on x86-64), so the page table doesn't take up too much space.
36 |
37 | To enable paging at boot, the kernel first constructs the page table in RAM. Then, it stores the physical address of the start of the page table in a register called the page table base register (PTBR). Finally, the kernel enables paging to translate all memory accesses with the MMU. On x86-64, control register 3 (CR3) acts as the PTBR, holding the page-aligned physical address of the top-level page table. Bit 31 of CR0, designated PG for Paging, is set to 1 to enable paging.
38 |
39 | The magic of the paging system is that the page table can be edited while the computer is running. This is how each process can have its own isolated memory space — when the OS switches context from one process to another, an important task is remapping the virtual memory space to a different area in physical memory. Let's say you have two processes: process A can have its code and data (likely loaded from an ELF file!) at `0x0000000000400000`, and process B can access its code and data from the very same address. Those two processes can even be instances of the same program, because they aren't actually fighting over that address range! The data for process A is somewhere far from process B in physical memory, and is mapped to `0x0000000000400000` by the kernel when switching to the process.
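Here's a small sketch you can run to see that in action. It uses `fork` (covered in detail in the next chapter) so that both processes see a variable at the exact same virtual address, even though each one's write lands in its own physical memory:

```c
#include <stdio.h>
#include <sys/wait.h>
#include <unistd.h>

int number = 0;  // same virtual address in parent and child, different physical memory

int main(void) {
    if (fork() == 0) {
        number = 1;  // the child's write goes to its own copy
    } else {
        number = 2;  // ...and so does the parent's
        wait(NULL);  // let the child print first
    }
    printf("pid %d sees number = %d at address %p\n", getpid(), number, (void *)&number);
}
```

Both processes print the same address but different values.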
40 |
41 |
42 |
43 | > **Aside: cursed ELF fact**
44 | >
45 | > In certain situations, `binfmt_elf` has to map the first page of memory to zeroes. Some programs written for UNIX System V Release 4.0 (SVr4), an OS from 1988 that was the first to support ELF, rely on null pointers being readable. And somehow, some programs still rely on that behavior.
46 | >
47 | > It seems like the Linux kernel dev implementing this was [a little disgruntled](https://github.com/torvalds/linux/blob/22b8cc3e78f5448b4c5df00303817a9137cd663f/fs/binfmt_elf.c#L1322-L1329):
48 | >
49 | > *"Why this, you ask??? Well SVr4 maps page 0 as read-only, and some applications 'depend' upon this behavior. Since we do not have the power to recompile these, we emulate the SVr4 behavior. Sigh."*
50 | >
51 | > Sigh.
52 |
53 | ## Security with Paging
54 |
55 | The process isolation enabled by memory paging improves code ergonomics (processes don't need to be aware of other processes to use memory), but it also creates a level of security: processes cannot access memory from other processes. This half answers one of the original questions from the start of this article:
56 |
57 | > If programs run directly on the CPU, and the CPU can directly access RAM, why can't code access memory from other processes, or, god forbid, the kernel?
58 |
59 | *Remember that? It feels like so long ago...*
60 |
61 | What about that kernel memory, though? First things first: the kernel obviously needs to store plenty of data of its own to keep track of all the processes running and even the page table itself. Every time a hardware interrupt, software interrupt, or system call is triggered and the CPU enters kernel mode, the kernel code needs to access that memory somehow.
62 |
63 | Linux's solution is to always allocate the top half of the virtual memory space to the kernel, so Linux is called a [*higher half kernel*](https://wiki.osdev.org/Higher_Half_Kernel). Windows employs a [similar](https://learn.microsoft.com/en-us/windows-hardware/drivers/kernel/overview-of-windows-memory-space) technique, while macOS is... [slightly](https://www.researchgate.net/figure/Overview-of-the-Mac-OS-X-virtual-memory-system-which-resides-inside-the-Mach-portion-of_fig1_264086271) [more](https://developer.apple.com/library/archive/documentation/Performance/Conceptual/ManagingMemory/Articles/AboutMemory.html) [complicated](https://developer.apple.com/library/archive/documentation/Darwin/Conceptual/KernelProgramming/vm/vm.html) and caused my brain to ooze out of my ears reading about it. \~(++)\~
64 |
65 |
66 |
67 | It would be terrible for security if userland processes could read or write kernel memory though, so paging enables a second layer of security: each page must specify permission flags. One flag determines whether the region is writable or only readable. Another flag tells the CPU that only kernel mode is allowed to access the region's memory. This latter flag is used to protect the entire higher half kernel space — the entire kernel memory space is actually available in the virtual memory mapping for user space programs, they just don't have the permissions to access it.
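As a rough illustration, using the x86-64 bit positions for these flags (present, writable, user-accessible, and no-execute), you can picture each page table entry as a 64-bit value with permission bits packed in alongside the physical address:

```c
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

#define PTE_PRESENT  (1ull << 0)   // page is mapped
#define PTE_WRITABLE (1ull << 1)   // writes allowed
#define PTE_USER     (1ull << 2)   // user mode may access; kernel-only if clear
#define PTE_NX       (1ull << 63)  // no-execute

int main(void) {
    // Hypothetical entry: a present, writable, kernel-only, non-executable data page.
    uint64_t pte = PTE_PRESENT | PTE_WRITABLE | PTE_NX | (0x1a2b3ull << 12);

    bool user_ok = (pte & PTE_PRESENT) && (pte & PTE_USER);
    printf("user mode may touch this page: %s\n", user_ok ? "yes" : "no");
}
```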
68 |
69 |
70 |
71 | The page table itself is actually contained within the kernel memory space! When the timer chip triggers a hardware interrupt for process switching, the CPU switches the privilege level to kernel mode and jumps to Linux kernel code. Being in kernel mode (Intel ring 0) allows the CPU to access the kernel-protected memory region. The kernel can then write to the page table (residing somewhere in that upper half of memory) to remap the lower half of virtual memory for the new process. When the kernel switches to the new process and the CPU enters user mode, it can no longer access any of the kernel memory.
72 |
73 | Just about every memory access goes through the MMU. Interrupt descriptor table handler pointers? Those address the kernel's virtual memory space as well.
74 |
75 | ## Hierarchical Paging and Other Optimizations
76 |
77 | 64-bit systems have memory addresses that are 64 bits long, meaning the 64-bit virtual memory space is a whopping 16 [exbibytes](https://en.wiktionary.org/wiki/exbibyte) in size. That is incredibly large, far larger than any computer that exists today or will exist any time soon. As far as I can tell, the most RAM in any computer ever was in the [Blue Waters supercomputer](https://en.wikipedia.org/wiki/Blue_Waters), with over 1.5 petabytes of RAM. That's still less than 0.01% of 16 EiB.
78 |
79 | If an entry in the page table was required for every 4 KiB section of virtual memory space, you would need 4,503,599,627,370,496 page table entries. With 8-byte-long page table entries, you would need 32 pebibytes of RAM just to store the page table alone. You may notice that's still larger than the world record for the most RAM in a computer.
80 |
81 | > **Aside: why the weird units?**
82 | >
83 | > I know it's uncommon and really ugly, but I find it important to clearly differentiate between binary byte size units (powers of 2) and metric ones (powers of 10). A kilobyte, kB, is an SI unit that means 1,000 bytes. A kibibyte, KiB, is an IEC-recommended unit that means 1,024 bytes. In terms of CPUs and memory addresses, byte counts are usually powers of two because computers are binary systems. Using KB (or worse, kB) to mean 1,024 would be more ambiguous.
84 |
85 | Since it would be impossible (or at least incredibly impractical) to have sequential page table entries for the entire possible virtual memory space, CPU architectures implement *hierarchical paging*. In hierarchical paging systems, there are multiple levels of page tables of increasingly small granularity. The top level entries cover large blocks of memory and point to page tables of smaller blocks, creating a tree structure. The individual entries for blocks of 4 KiB or whatever the page size is are the leaves of the tree.
86 |
87 | x86-64 historically uses 4-level hierarchical paging. In this system, each page table entry is found by offsetting the start of the containing table by a portion of the address. This portion starts with the most significant bits, which work as a prefix so the entry covers all addresses starting with those bits. The entry points to the start of the next level of table containing the subtrees for that block of memory, which are again indexed with the next collection of bits.
88 |
89 | The designers of x86-64's 4-level paging also chose to ignore the top 16 bits of all virtual pointers to save page table space. 48 bits gets you a 256 TiB virtual address space (canonically split into a 128 TiB lower half for user space and a 128 TiB upper half for the kernel), which was deemed to be large enough. (The full 64 bits would get you 16 EiB, which is kind of a lot.)
90 |
91 | Since the top 16 bits are skipped, the "most significant bits" for indexing the first level of the page table actually start at bit 47 rather than 63. This also means the higher half kernel diagram from earlier in this chapter was technically inaccurate; the kernel space start address should've been depicted as the midpoint of an address space smaller than 64 bits.
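For instance, here's how a 48-bit virtual address breaks down into the four 9-bit table indices plus the 12-bit page offset (a sketch with a made-up address):

```c
#include <stdint.h>
#include <stdio.h>

int main(void) {
    uint64_t vaddr = 0x00007f1234567890;  // hypothetical canonical user-space address

    unsigned level4 = (vaddr >> 39) & 0x1ff;  // bits 47-39: index into the top-level table
    unsigned level3 = (vaddr >> 30) & 0x1ff;  // bits 38-30
    unsigned level2 = (vaddr >> 21) & 0x1ff;  // bits 29-21
    unsigned level1 = (vaddr >> 12) & 0x1ff;  // bits 20-12: index into the leaf table
    unsigned offset = vaddr & 0xfff;          // bits 11-0: offset within the 4 KiB page

    printf("%u -> %u -> %u -> %u, offset %#x\n", level4, level3, level2, level1, offset);
}
```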
92 |
93 |
94 |
95 | Hierarchical paging solves the space problem because at any level of the tree, the pointer to the next entry can be null (`0x0`). This allows entire subtrees of the page table to be elided, meaning unmapped areas of the virtual memory space don't take up any space in RAM. Lookups at unmapped memory addresses can fail quickly because the CPU can error as soon as it sees an empty entry higher up in the tree. Page table entries also have a presence flag that can be used to mark them as unusable even if the address appears valid.
96 |
97 | Another benefit of hierarchical paging is the ability to efficiently switch out large sections of the virtual memory space. A large swath of virtual memory might be mapped to one area of physical memory for one process, and a different area for another process. The kernel can store both mappings in memory and simply update the pointers at the top level of the tree when switching processes. If the entire memory space mapping was stored as a flat array of entries, the kernel would have to update a lot of entries, which would be slow and still require independently keeping track of the memory mappings for each process.
98 |
99 | I said x86-64 "historically" uses 4-level paging because recent processors implement [5-level paging](https://en.wikipedia.org/wiki/Intel_5-level_paging). 5-level paging adds another level of indirection as well as 9 more addressing bits to expand the address space to 128 PiB with 57-bit addresses. 5-level paging is supported by operating systems including Linux [since 2017](https://lwn.net/Articles/717293/) as well as recent Windows 10 and 11 server versions.
100 |
101 | > **Aside: physical address space limits**
102 | >
103 | > Just as operating systems don't use all 64 bits for virtual addresses, processors don't use entire 64-bit physical addresses. When 4-level paging was the standard, x86-64 CPUs didn't use more than 46 bits, meaning the physical address space was limited to only 64 TiB. With 5-level paging, support has been extended to 52 bits, supporting a 4 PiB physical address space.
104 | >
105 | > On the OS level, it's advantageous for the virtual address space to be larger than the physical address space. As Linus Torvalds [said](https://www.realworldtech.com/forum/?threadid=76912&curpostid=76973), "[i]t needs to be bigger, by a factor of _at least_ two, and that's quite frankly pushing it, and you're much better off having a factor of ten or more. Anybody who doesn't get that is a moron. End of discussion."
106 |
107 | ## Swapping and Demand Paging
108 |
109 | A memory access might fail for a few reasons: the address might be out of range, it might not be mapped by the page table, or it might have an entry that's marked as not present. In any of these cases, the MMU will trigger a hardware interrupt called a *page fault* to let the kernel handle the problem.
110 |
111 | Sometimes the access really was invalid or prohibited; in those cases, the kernel will probably terminate the program with a [segmentation fault](https://en.wikipedia.org/wiki/Segmentation_fault) error.
112 |
113 |
128 |
129 | For one, this allows syscalls like [mmap](https://man7.org/linux/man-pages/man2/mmap.2.html) that lazily map entire files from disk to virtual memory to exist. If you're familiar with LLaMa.cpp, a runtime for a leaked Facebook language model, Justine Tunney recently significantly optimized it by [making all the loading logic use mmap](https://justine.lol/mmap/). (If you haven't heard of her before, [check her stuff out](https://justine.lol/)! Cosmopolitan Libc and APE are really cool and might be interesting if you've been enjoying this article.)
130 |
131 | > *Apparently there's a [lot](https://rentry.org/Jarted) [of](https://news.ycombinator.com/item?id=35413289) [drama](https://news.ycombinator.com/item?id=35458004) about Justine's involvement in this change. Just pointing this out so I don't get screamed at by random internet users. I must confess that I haven't read most of the drama, and everything I said about Justine's stuff being cool is still very true.*
132 |
133 | When you execute a program and load its libraries, the kernel doesn't actually read anything into memory up front. It only creates an mmap of the file — when the CPU tries to execute the code, the page immediately faults and the kernel replaces the page with a real block of memory.
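You can see the same laziness from userspace with a tiny sketch (the file path is just an arbitrary example, and error handling is omitted):

```c
#include <fcntl.h>
#include <stdio.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <unistd.h>

int main(void) {
    int fd = open("/etc/hostname", O_RDONLY);  // any readable file will do
    struct stat st;
    fstat(fd, &st);

    // This call returns almost instantly: the kernel only records the mapping,
    // it doesn't read any file contents yet.
    char *data = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0);

    // The first access to the mapped memory page faults, and the kernel
    // reads that page in from disk on demand.
    printf("first byte: %c\n", data[0]);

    munmap(data, st.st_size);
    close(fd);
}
```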
134 |
135 | Demand paging also enables the technique that you've probably seen under the name "swapping" or "paging." Operating systems can free up physical memory by writing memory pages to disk and then removing them from physical memory but keeping them in virtual memory with the present flag set to 0. If that virtual memory is read, the OS can then restore the memory from disk to RAM and set the present flag back to 1. The OS may have to swap a different section of RAM to make space for the memory being loaded from disk. Disk reads and writes are slow, so operating systems try to make swapping happen as little as possible with [efficient page replacement algorithms](https://en.wikipedia.org/wiki/Page_replacement_algorithm).
136 |
137 | An interesting hack is to reuse the physical address bits of a non-present page table entry to store where the page's contents live on disk. Since the MMU page faults as soon as it sees that the present flag is cleared, it doesn't matter that the stored value isn't a valid memory address. This isn't practical in all cases, but it's amusing to think about.
138 |
--------------------------------------------------------------------------------
/src/content/chapters/3-how-to-run-a-program.mdx:
--------------------------------------------------------------------------------
1 | ---
2 | chapter: 3
3 | title: How to Run a Program
4 | shortname: Exec
5 | slug: how-to-run-a-program
6 | updatedAt: 2023-07-24T15:57:08.044Z
7 | ---
8 |
9 | import CodeBlock from '../../components/CodeBlock.astro'
10 |
11 | So far, we've covered how CPUs execute machine code loaded from executables, what ring-based security is, and how syscalls work. In this section, we'll dive deep into the Linux kernel to figure out how programs are loaded and run in the first place.
12 |
13 | We're specifically going to look at Linux on x86-64. Why?
14 |
15 | - Linux is a fully featured production OS for desktop, mobile, and server use cases. Linux is open source, so it's super easy to research just by reading its source code. I will be directly referencing some kernel code in this article!
16 | - x86-64 is the architecture that most modern desktop computers use, and the target architecture of a lot of code. The subset of behavior I mention that is x86-64-specific will generalize well.
17 |
18 | Most of what we learn will generalize well to other operating systems and architectures, even if they differ in various specific ways.
19 |
20 | ## Basic Behavior of Exec Syscalls
21 |
22 |
23 |
24 | Let's start with a very important system call: `execve`. It loads a program and, if successful, replaces the current process with that program. A couple of other variants exist (`execlp`, `execvpe`, etc.), but they're C library functions that all layer on top of `execve` in various fashions.
25 |
26 | > **Aside: `execveat`**
27 | >
28 | > `execve` is *actually* built on top of `execveat`, a more general syscall that runs a program with some configuration options. For simplicity, we'll mostly talk about `execve`; the only difference is that it provides some defaults to `execveat`.
29 | >
30 | > Curious what `ve` stands for? The `v` means one parameter is the vector (list) of arguments (`argv`), and the `e` means another parameter is the vector of environment variables (`envp`). Various other exec syscalls have different suffixes to designate different call signatures. The `at` in `execveat` is just "at", because it specifies the location to run `execve` at.
31 |
32 | The call signature of `execve` is:
33 |
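Here's the prototype as documented in the `execve(2)` man page:

```c
int execve(const char *pathname, char *const argv[], char *const envp[]);
```

Note how it matches the suffixes from the aside above: a vector of arguments and a vector of environment variables.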
34 | if (fd == AT_FDCWD) \{ /\* special codepath \*/ \}.
115 |
116 | ### Step 1: Setup
117 |
118 | We've now reached `do_execveat_common`, the core function handling program execution. We're going to take a brief step back from staring at code to get a bigger picture view of what this function does.
119 |
120 | The first major job of `do_execveat_common` is setting up a struct called `linux_binprm`. I won't include a copy of [the whole struct definition](https://github.com/torvalds/linux/blob/22b8cc3e78f5448b4c5df00303817a9137cd663f/include/linux/binfmts.h#L15-L65), but there are several important fields to go over:
121 |
122 | - Data structures like `mm_struct` and `vm_area_struct` are set up to prepare virtual memory management for the new program.
123 | - `argc` and `envc` are calculated and stored to be passed to the program.
124 | - `filename` and `interp` store the filename of the program and its interpreter, respectively. These start out equal to each other, but can change in some cases: one such case is when running interpreted scripts with a [shebang](https://en.wikipedia.org/wiki/Shebang_(Unix)). When executing a Python program, for example, `filename` points to the source file but `interp` is the path to the Python interpreter.
125 | - `buf` is an array filled with the first 256 bytes of the file to be executed. It's used to detect the format of the file and load script shebangs.
126 |
127 | (TIL: binprm stands for **bin**ary **pr**ogra**m**.)
128 |
129 | Let's take a closer look at this buffer `buf`:
130 |
131 |
199 |
200 | COMPUTERS ARE SO COOL!
201 |
202 | Since shebangs are handled by the kernel, and pull from `buf` instead of loading the whole file, they're *always* truncated to the length of `buf`. Apparently, 4 years ago, someone got annoyed by the kernel truncating their >128-character paths, and their solution was to double the truncation point by doubling the buffer size! Today, on your very own Linux machine, if you have a shebang line more than 256 characters long, everything past 256 characters will be *completely lost*.
203 |
204 |
205 |
206 | Imagine having a bug because of this. Imagine trying to figure out the root cause of what's breaking your code. Imagine how it would feel, discovering that the problem is deep within the Linux kernel. Woe to the next IT person at a massive enterprise who discovers that part of a path has mysteriously gone missing.
207 |
208 | **The second wonky thing:** remember how it's only *convention* for `argv[0]` to be the program name, how the caller can pass any `argv` they want to an exec syscall and it will pass through unmoderated?
209 |
210 | It just so happens that `binfmt_script` is one of those places that *assumes* `argv[0]` is the program name. It always removes `argv[0]`, and then adds the following to the start of `argv`:
211 |
212 | - Path to the interpreter
213 | - Arguments to the interpreter
214 | - Filename of the script
215 |
216 | 217 | **Example: Argument Modification** 218 | 219 | Let's look at a sample `execve` call: 220 | 221 |244 | 245 | After updating `argv`, the handler finishes preparing the file for execution by setting `linux_binprm.interp` to the interpreter path (in this case, the Node binary). Finally, it returns 0 to indicate success preparing the program for execution. 246 | 247 | ### Format Highlight: Miscellaneous Interpreters 248 | 249 | Another interesting handler is `binfmt_misc`. It opens up the ability to add some limited formats through userland configuration, by mounting a special file system at `/proc/sys/fs/binfmt_misc/`. Programs can perform [specially formatted](https://docs.kernel.org/admin-guide/binfmt-misc.html) writes to files in this directory to add their own handlers. Each configuration entry specifies: 250 | 251 | - How to detect their file format. This can specify either a magic number at a certain offset or a file extension to look for. 252 | - The path to an interpreter executable. There's no way to specify interpreter arguments, so a wrapper script is needed if those are desired. 253 | - Some configuration flags, including one specifying how `binfmt_misc` updates `argv`. 254 | 255 | This `binfmt_misc` system is often used by Java installations, configured to detect class files by their `0xCAFEBABE` magic bytes and JAR files by their extension. On my particular system, a handler is configured that detects Python bytecode by its .pyc extension and passes it to the appropriate handler. 256 | 257 | This is a pretty cool way to let program installers add support for their own formats without needing to write highly privileged kernel code. 258 | 259 | ## In the End (Not the Linkin Park Song) 260 | 261 | An exec syscall will always end up in one of two paths: 262 | 263 | - It will eventually reach an executable binary format that it understands, perhaps after several layers of script interpreters, and run that code. At this point, the old code has been replaced. 264 | - ... or it will exhaust all its options and return an error code to the calling program, tail between its legs. 265 | 266 | If you've ever used a Unix-like system, you might've noticed that shell scripts run from a terminal still execute if they don't have a shebang line or `.sh` extension. You can test this out right now if you have a non-Windows terminal handy: 267 | 268 |222 | ```c 223 | // Arguments: filename, argv, envp 224 | execve("./script", [ "A", "B", "C" ], []); 225 | ``` 226 | 227 | 228 | This hypothetical `script` file has the following shebang as its first line: 229 | 230 |231 | ```js 232 | #!/usr/bin/node --experimental-module 233 | ``` 234 | 235 | 236 | The modified `argv` finally passed to the Node interpreter will be: 237 | 238 |239 | ```c 240 | [ "/usr/bin/node", "--experimental-module", "./script", "B", "C" ] 241 | ``` 242 | 243 |