From f3d5cf8e68cc4f9dd9b0ed7e052852373b62b365 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sat, 4 May 2024 23:54:01 +0200 Subject: [PATCH 1/8] Add Typescript for type checking (but still with js files) (#81) * Emit types using tsc --- .eslintrc.json | 3 ++- .gitignore | 1 + index.d.ts | 54 +++++++++++++++++++++++++++++++++++++++++++++++ index.js | 12 +++++++++++ lib/mocompiler.js | 11 +++++----- lib/moparser.js | 2 +- lib/pocompiler.js | 2 +- lib/poparser.js | 8 +++---- lib/shared.js | 6 +++--- package.json | 13 ++++++++++-- tsconfig.json | 36 +++++++++++++++++++++++++++++++ 11 files changed, 131 insertions(+), 17 deletions(-) create mode 100644 index.d.ts create mode 100644 tsconfig.json diff --git a/.eslintrc.json b/.eslintrc.json index 30149ce..bcfae6d 100644 --- a/.eslintrc.json +++ b/.eslintrc.json @@ -3,7 +3,8 @@ "es2021": true, "node": true }, - "extends": "standard", + "extends": ["eslint:recommended", "plugin:@typescript-eslint/recommended"], + "parser": "@typescript-eslint/parser", "parserOptions": { "ecmaVersion": "latest", "sourceType": "module" diff --git a/.gitignore b/.gitignore index 61b7f20..6fc64df 100644 --- a/.gitignore +++ b/.gitignore @@ -1,3 +1,4 @@ /node_modules +/@types npm-debug.log .DS_Store diff --git a/index.d.ts b/index.d.ts new file mode 100644 index 0000000..d47b72b --- /dev/null +++ b/index.d.ts @@ -0,0 +1,54 @@ +import { Transform } from "readable-stream"; + +import {Buffer} from "safe-buffer"; + +export declare module 'encoding' { + export function convert(buf: Buffer, toCharset: string, fromCharset: string): Buffer; +} + +export interface Compiler { + _table: GetTextTranslations; + compile(): Buffer; +} + +export interface GetTextComment { + translator?: string; + reference?: string; + extracted?: string; + flag?: string; + previous?: string; +} + +export interface GetTextTranslation { + msgctxt?: string; + msgid: string; + msgid_plural?: string; + msgstr: string[]; + comments?: GetTextComment; +} + +export interface GetTextTranslations { + charset: string; + headers: { [headerName: string]: string }; + translations: { [msgctxt: string]: { [msgId: string]: GetTextTranslation } }; +} + +export interface parserOptions { + defaultCharset?: string; + validation?: boolean; +} + +export interface po { + parse: (buffer: Buffer | string, defaultCharset?: string) => GetTextTranslations; + compile: (table: GetTextTranslations, options?: parserOptions) => Buffer; + createParseStream: (options?: parserOptions, transformOptions?: import('readable-stream').TransformOptions) => Transform; +} + +export interface mo { + parse: (buffer: Buffer | string, defaultCharset?: string) => GetTextTranslations; + compile: (table: GetTextTranslations, options?: parserOptions) => Buffer; +} + +export * from "./@types"; + +export default { po, mo } as { po: po, mo: mo }; diff --git a/index.js b/index.js index fab9b44..1f5a96c 100644 --- a/index.js +++ b/index.js @@ -3,12 +3,24 @@ import poCompiler from './lib/pocompiler.js'; import moParser from './lib/moparser.js'; import moCompiler from './lib/mocompiler.js'; +/** + * Translation parser and compiler for PO files + * @see https://www.gnu.org/software/gettext/manual/html_node/PO.html + * + * @type {import("./index.d.ts").po} po + */ export const po = { parse: poParser.parse, createParseStream: poParser.stream, compile: poCompiler }; +/** + * Translation parser and compiler for PO files + * @see https://www.gnu.org/software/gettext/manual/html_node/MO.html + * + * @type {import("./index.d.ts").mo} mo + */ export const mo = { parse: moParser, compile: moCompiler diff --git a/lib/mocompiler.js b/lib/mocompiler.js index 9715d63..9e8747d 100644 --- a/lib/mocompiler.js +++ b/lib/mocompiler.js @@ -7,20 +7,21 @@ import contentType from 'content-type'; * Exposes general compiler function. Takes a translation * object as a parameter and returns binary MO object * - * @param {Object} table Translation object + * @param {import('./index.d.ts').GetTextTranslations} table Translation object * @return {Buffer} Compiled binary MO object */ export default function (table) { const compiler = new Compiler(table); return compiler.compile(); -}; +} /** * Creates a MO compiler object. * * @constructor - * @param {Object} table Translation table as defined in the README + * @param {import('./index.d.ts').GetTextTranslations} table Translation table as defined in the README + * @return {import('./index.d.ts').Compiler} Compiler */ function Compiler (table = {}) { this._table = table; @@ -148,7 +149,7 @@ Compiler.prototype._generateList = function () { /** * Calculate buffer size for the final binary object * - * @param {Array} list An array of translation strings from _generateList + * @param {import('./index.d.ts').GetTextTranslations} list An array of translation strings from _generateList * @return {Object} Size data of {msgid, msgstr, total} */ Compiler.prototype._calculateSize = function (list) { @@ -183,7 +184,7 @@ Compiler.prototype._calculateSize = function (list) { /** * Generates the binary MO object from the translation list * - * @param {Array} list translation list + * @param {import('./index.d.ts').GetTextTranslations} list translation list * @param {Object} size Byte size information * @return {Buffer} Compiled MO object */ diff --git a/lib/moparser.js b/lib/moparser.js index 09c10f8..0054710 100644 --- a/lib/moparser.js +++ b/lib/moparser.js @@ -12,7 +12,7 @@ export default function (buffer, defaultCharset) { const parser = new Parser(buffer, defaultCharset); return parser.parse(); -}; +} /** * Creates a MO parser object. diff --git a/lib/pocompiler.js b/lib/pocompiler.js index f4baa0a..c08671b 100644 --- a/lib/pocompiler.js +++ b/lib/pocompiler.js @@ -14,7 +14,7 @@ export default function (table, options) { const compiler = new Compiler(table, options); return compiler.compile(); -}; +} /** * Creates a PO compiler object. diff --git a/lib/poparser.js b/lib/poparser.js index 77b8b12..70cce36 100644 --- a/lib/poparser.js +++ b/lib/poparser.js @@ -14,18 +14,18 @@ export function parse (input, options = {}) { const parser = new Parser(input, options); return parser.parse(); -}; +} /** * Parses a PO stream, emits translation table in object mode * - * @typedef {{ defaultCharset: strubg, validation: boolean }} Options + * @typedef {{ defaultCharset: string, validation: boolean }} Options * @param {Options} [options] Optional options with defaultCharset and validation * @param {import('readable-stream').TransformOptions} [transformOptions] Optional stream options */ export function stream (options = {}, transformOptions = {}) { return new PoParserTransform(options, transformOptions); -}; +} /** * Creates a PO parser object. If PO object is a string, @@ -515,7 +515,7 @@ Parser.prototype._finalize = function (tokens) { /** * Creates a transform stream for parsing PO input * - * @typedef {{ defaultCharset: strubg, validation: boolean }} Options + * @typedef {{ defaultCharset: string, validation: boolean }} Options * @constructor * @param {Options} options Optional options with defaultCharset and validation * @param {import('readable-stream').TransformOptions} transformOptions Optional stream options diff --git a/lib/shared.js b/lib/shared.js index 8cf706c..5e2d3a5 100644 --- a/lib/shared.js +++ b/lib/shared.js @@ -45,8 +45,8 @@ export function parseHeader (str = '') { * @param {Object} [headers = {}] An object with parsed headers * @returns {number} Parsed result */ -export function parseNPluralFromHeadersSafely (headers = {}, fallback = 1) { - const pluralForms = headers[PLURAL_FORMS]; +export function parseNPluralFromHeadersSafely (headers, fallback = 1) { + const pluralForms = headers ? headers[PLURAL_FORMS] : false; if (!pluralForms) { return fallback; @@ -101,7 +101,7 @@ export function formatCharset (charset = 'iso-8859-1', defaultCharset = 'iso-885 * * @param {String} str PO formatted string to be folded * @param {Number} [maxLen=76] Maximum allowed length for folded lines - * @return {Array} An array of lines + * @return {string[]} An array of lines */ export function foldLine (str, maxLen = 76) { const lines = []; diff --git a/package.json b/package.json index d01f014..dfc5bba 100644 --- a/package.json +++ b/package.json @@ -22,9 +22,11 @@ "test-generate-mo": "msgfmt test/fixtures/latin13.po -o test/fixtures/latin13.mo & msgfmt test/fixtures/utf8.po -o test/fixtures/utf8.mo & msgfmt test/fixtures/obsolete.po -o test/fixtures/obsolete.mo", "test": "mocha", "preversion": "npm run lint && npm test", - "postversion": "git push && git push --tags" + "postversion": "git push && git push --tags", + "prepublish": "tsc && npm run lint && npm run test" }, "main": "./index.js", + "types": "./index.d.ts", "license": "MIT", "dependencies": { "content-type": "^1.0.5", @@ -33,13 +35,20 @@ "safe-buffer": "^5.2.1" }, "devDependencies": { + "@types/chai": "latest", + "@types/content-type": "^1.1.8", + "@types/mocha": "latest", + "@types/readable-stream": "^4.0.11", + "@typescript-eslint/eslint-plugin": "^6.18.1", + "@typescript-eslint/parser": "^6.14.0", "chai": "^5.0.3", "eslint": "^8.56.0", "eslint-config-standard": "^17.1.0", "eslint-plugin-import": "^2.29.1", "eslint-plugin-n": "^16.6.2", "eslint-plugin-promise": "^6.1.1", - "mocha": "^10.3.0" + "mocha": "^10.3.0", + "typescript": "^5.4.4" }, "keywords": [ "i18n", diff --git a/tsconfig.json b/tsconfig.json new file mode 100644 index 0000000..1564f0f --- /dev/null +++ b/tsconfig.json @@ -0,0 +1,36 @@ +{ + "compilerOptions": { + "noImplicitAny": true, + "removeComments": false, + "module": "Node16", + "moduleResolution": "Node16", + "target": "ES2015", + + // Strict mode + "strict": true, + + // Allow javascript files + "allowJs": true, + + // Check js files for errors + "checkJs": false, + + // Output d.ts files to @types + "outDir": "@types", + + // Generate d.ts files + "declaration": true, + + // This compiler run should + // only output d.ts files + "emitDeclarationOnly": true, + // Minify + "pretty": false, + // Skip lib check when compiling + "skipLibCheck": true + }, + "include": [ + "lib/**/*.js", + "index.d.ts" + ] +} From 9e477d8917880bfdaec07476963e258adeb7afc4 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sat, 4 May 2024 23:56:19 +0200 Subject: [PATCH 2/8] Replaces deprecations (substr, slice) with the modern syntax (#84) * Update deprecated code --- lib/moparser.js | 10 ++++++++-- lib/poparser.js | 14 +++++++------- 2 files changed, 15 insertions(+), 9 deletions(-) diff --git a/lib/moparser.js b/lib/moparser.js index 0054710..43097cf 100644 --- a/lib/moparser.js +++ b/lib/moparser.js @@ -87,14 +87,20 @@ Parser.prototype._loadTranslationTable = function () { offsetOriginals += 4; position = this._fileContents[this._readFunc](offsetOriginals); offsetOriginals += 4; - msgid = this._fileContents.slice(position, position + length); + msgid = this._fileContents.subarray( + position, + position + length, + ); // matching msgstr length = this._fileContents[this._readFunc](offsetTranslations); offsetTranslations += 4; position = this._fileContents[this._readFunc](offsetTranslations); offsetTranslations += 4; - msgstr = this._fileContents.slice(position, position + length); + msgstr = this._fileContents.subarray( + position, + position + length, + ); if (!i && !msgid.toString()) { this._handleCharset(msgstr); diff --git a/lib/poparser.js b/lib/poparser.js index 70cce36..a9803e1 100644 --- a/lib/poparser.js +++ b/lib/poparser.js @@ -77,8 +77,8 @@ Parser.prototype._handleCharset = function (buf = '') { let match; if ((pos = str.search(/^\s*msgid/im)) >= 0) { - pos = pos + str.substr(pos + 5).search(/^\s*(msgid|msgctxt)/im); - headers = str.substr(0, pos >= 0 ? pos + 5 : str.length); + pos = pos + str.substring(pos + 5).search(/^\s*(msgid|msgctxt)/im); + headers = str.substring(0, pos >= 0 ? pos + 5 : str.length); } if ((match = headers.match(/[; ]charset\s*=\s*([\w-]+)(?:[\s;]|\\n)*"\s*$/mi))) { @@ -279,16 +279,16 @@ Parser.prototype._parseComments = function (tokens) { lines.forEach(line => { switch (line.charAt(0) || '') { case ':': - comment.reference.push(line.substr(1).trim()); + comment.reference.push(line.substring(1).trim()); break; case '.': - comment.extracted.push(line.substr(1).replace(/^\s+/, '')); + comment.extracted.push(line.substring(1).replace(/^\s+/, '')); break; case ',': - comment.flag.push(line.substr(1).replace(/^\s+/, '')); + comment.flag.push(line.substring(1).replace(/^\s+/, '')); break; case '|': - comment.previous.push(line.substr(1).replace(/^\s+/, '')); + comment.previous.push(line.substring(1).replace(/^\s+/, '')); break; case '~': break; @@ -392,7 +392,7 @@ Parser.prototype._handleValues = function (tokens) { curContext = false; curComments = false; - } else if (tokens[i].key.substr(0, 6).toLowerCase() === 'msgstr') { + } else if (tokens[i].key.substring(0, 6).toLowerCase() === 'msgstr') { if (lastNode) { lastNode.msgstr = (lastNode.msgstr || []).concat(tokens[i].value); } From 052d3d2a85dd6fbc4c44aa85313ec4ea6b23a34e Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sun, 5 May 2024 00:52:53 +0200 Subject: [PATCH 3/8] Move files from lib to src and index into src (#85) * move lib to src * path updates - as suggested by @johnhooks to set as source for tests the "src" folder (and not the builded one) - updated node internal modules paths prefix (ref. https://nodejs.org/api/module.html#modules-nodemodule-api) * typescript file compilation config --- .gitignore | 1 + .npmignore | 1 + package.json | 8 ++++---- index.d.ts => src/index.d.ts | 0 index.js => src/index.js | 8 ++++---- {lib => src}/mocompiler.js | 0 {lib => src}/moparser.js | 0 {lib => src}/pocompiler.js | 0 {lib => src}/poparser.js | 0 {lib => src}/shared.js | 0 test/mo-compiler-test.js | 10 +++++----- test/mo-parser-test.js | 10 +++++----- test/module.mjs | 2 +- test/po-compiler-test.js | 12 ++++++------ test/po-obsolete-test.js | 12 ++++++------ test/po-parser-test.js | 10 +++++----- test/shared.js | 12 +++++------- tsconfig.json | 11 ++++++----- 18 files changed, 49 insertions(+), 48 deletions(-) rename index.d.ts => src/index.d.ts (100%) rename index.js => src/index.js (74%) rename {lib => src}/mocompiler.js (100%) rename {lib => src}/moparser.js (100%) rename {lib => src}/pocompiler.js (100%) rename {lib => src}/poparser.js (100%) rename {lib => src}/shared.js (100%) diff --git a/.gitignore b/.gitignore index 6fc64df..ee8dea8 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ /node_modules +/lib /@types npm-debug.log .DS_Store diff --git a/.npmignore b/.npmignore index f3611ac..478b410 100644 --- a/.npmignore +++ b/.npmignore @@ -1,3 +1,4 @@ /test +/src .eslintrc.js .gitignore diff --git a/package.json b/package.json index dfc5bba..d279a33 100644 --- a/package.json +++ b/package.json @@ -18,15 +18,15 @@ "node": ">=18" }, "scripts": { - "lint": "eslint lib/*.js test/*.js index.js", + "lint": "eslint src/*.js test/*.js", "test-generate-mo": "msgfmt test/fixtures/latin13.po -o test/fixtures/latin13.mo & msgfmt test/fixtures/utf8.po -o test/fixtures/utf8.mo & msgfmt test/fixtures/obsolete.po -o test/fixtures/obsolete.mo", "test": "mocha", "preversion": "npm run lint && npm test", "postversion": "git push && git push --tags", "prepublish": "tsc && npm run lint && npm run test" }, - "main": "./index.js", - "types": "./index.d.ts", + "main": "./lib/index.js", + "types": "./lib/index.d.ts", "license": "MIT", "dependencies": { "content-type": "^1.0.5", @@ -48,7 +48,7 @@ "eslint-plugin-n": "^16.6.2", "eslint-plugin-promise": "^6.1.1", "mocha": "^10.3.0", - "typescript": "^5.4.4" + "typescript": "^5.4.5" }, "keywords": [ "i18n", diff --git a/index.d.ts b/src/index.d.ts similarity index 100% rename from index.d.ts rename to src/index.d.ts diff --git a/index.js b/src/index.js similarity index 74% rename from index.js rename to src/index.js index 1f5a96c..05e32a3 100644 --- a/index.js +++ b/src/index.js @@ -1,7 +1,7 @@ -import * as poParser from './lib/poparser.js'; -import poCompiler from './lib/pocompiler.js'; -import moParser from './lib/moparser.js'; -import moCompiler from './lib/mocompiler.js'; +import * as poParser from './poparser.js'; +import poCompiler from './pocompiler.js'; +import moParser from './moparser.js'; +import moCompiler from './mocompiler.js'; /** * Translation parser and compiler for PO files diff --git a/lib/mocompiler.js b/src/mocompiler.js similarity index 100% rename from lib/mocompiler.js rename to src/mocompiler.js diff --git a/lib/moparser.js b/src/moparser.js similarity index 100% rename from lib/moparser.js rename to src/moparser.js diff --git a/lib/pocompiler.js b/src/pocompiler.js similarity index 100% rename from lib/pocompiler.js rename to src/pocompiler.js diff --git a/lib/poparser.js b/src/poparser.js similarity index 100% rename from lib/poparser.js rename to src/poparser.js diff --git a/lib/shared.js b/src/shared.js similarity index 100% rename from lib/shared.js rename to src/shared.js diff --git a/test/mo-compiler-test.js b/test/mo-compiler-test.js index 4796425..3b0a8b6 100644 --- a/test/mo-compiler-test.js +++ b/test/mo-compiler-test.js @@ -1,9 +1,9 @@ +import { promisify } from 'node:util'; +import path from 'node:path'; +import { mo } from '../src/index.js'; +import { readFile as fsReadFile } from 'node:fs'; +import { fileURLToPath } from 'node:url'; import * as chai from 'chai'; -import { promisify } from 'util'; -import path from 'path'; -import { mo } from '../index.js'; -import { readFile as fsReadFile } from 'fs'; -import { fileURLToPath } from 'url'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/test/mo-parser-test.js b/test/mo-parser-test.js index 723368a..4391471 100644 --- a/test/mo-parser-test.js +++ b/test/mo-parser-test.js @@ -1,9 +1,9 @@ +import { promisify } from 'node:util'; +import path from 'node:path'; +import { readFile as fsReadFile } from 'node:fs'; +import { fileURLToPath } from 'node:url'; import * as chai from 'chai'; -import { promisify } from 'util'; -import path from 'path'; -import { mo } from '../index.js'; -import { readFile as fsReadFile } from 'fs'; -import { fileURLToPath } from 'url'; +import { mo } from '../src/index.js'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/test/module.mjs b/test/module.mjs index 1796fd6..b1b48b0 100644 --- a/test/module.mjs +++ b/test/module.mjs @@ -1,5 +1,5 @@ import { expect } from 'chai'; -import { po, mo } from '../index.js'; +import { po, mo } from '../src/index.js'; describe('esm module', () => { it('should allow named imports', () => { diff --git a/test/po-compiler-test.js b/test/po-compiler-test.js index 18ad149..0e969ce 100644 --- a/test/po-compiler-test.js +++ b/test/po-compiler-test.js @@ -1,10 +1,10 @@ -import { EOL } from 'os'; -import { promisify } from 'util'; -import path from 'path'; -import { readFile as fsReadFile } from 'fs'; +import { readFile as fsReadFile } from 'node:fs'; +import { promisify } from 'node:util'; +import path from 'node:path'; +import { EOL } from 'node:os'; +import { fileURLToPath } from 'node:url'; +import { po } from '../src/index.js'; import * as chai from 'chai'; -import { po } from '../index.js'; -import { fileURLToPath } from 'url'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/test/po-obsolete-test.js b/test/po-obsolete-test.js index f0e696f..d8a4a18 100644 --- a/test/po-obsolete-test.js +++ b/test/po-obsolete-test.js @@ -1,10 +1,10 @@ -import { EOL } from 'os'; +import { EOL } from 'node:os'; +import path from 'node:path'; +import fs from 'node:fs'; +import { promisify } from 'node:util'; import * as chai from 'chai'; -import { promisify } from 'util'; -import path from 'path'; -import fs from 'fs'; -import * as gettextParser from '../index.js'; -import { fileURLToPath } from 'url'; +import * as gettextParser from '../src/index.js'; +import { fileURLToPath } from 'node:url'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/test/po-parser-test.js b/test/po-parser-test.js index 3a006c1..644e222 100644 --- a/test/po-parser-test.js +++ b/test/po-parser-test.js @@ -1,9 +1,9 @@ import * as chai from 'chai'; -import { promisify } from 'util'; -import path from 'path'; -import fs from 'fs'; -import * as gettextParser from '../index.js'; -import { fileURLToPath } from 'url'; +import { promisify } from 'node:util'; +import path from 'node:path'; +import fs from 'node:fs'; +import * as gettextParser from '../src/index.js'; +import { fileURLToPath } from 'node:url'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/test/shared.js b/test/shared.js index c40dfd6..0263c02 100644 --- a/test/shared.js +++ b/test/shared.js @@ -1,11 +1,9 @@ -'use strict'; - +import { promisify } from 'node:util'; +import path from 'node:path'; +import { readFile as fsReadFile } from 'node:fs'; +import { fileURLToPath } from 'node:url'; import * as chai from 'chai'; -import { promisify } from 'util'; -import path from 'path'; -import { formatCharset, parseHeader, generateHeader, foldLine, parseNPluralFromHeadersSafely } from '../lib/shared.js'; -import { readFile as fsReadFile } from 'fs'; -import { fileURLToPath } from 'url'; +import { formatCharset, parseHeader, generateHeader, foldLine, parseNPluralFromHeadersSafely } from '../src/shared.js'; const __filename = fileURLToPath(import.meta.url); const __dirname = path.dirname(__filename); diff --git a/tsconfig.json b/tsconfig.json index 1564f0f..96e5c6b 100644 --- a/tsconfig.json +++ b/tsconfig.json @@ -15,22 +15,23 @@ // Check js files for errors "checkJs": false, + // the directory sources are in + "rootDir": "src", + // Output d.ts files to @types - "outDir": "@types", + "outDir": "lib", // Generate d.ts files "declaration": true, - // This compiler run should - // only output d.ts files - "emitDeclarationOnly": true, // Minify "pretty": false, + // Skip lib check when compiling "skipLibCheck": true }, "include": [ - "lib/**/*.js", + "src/**/*.js", "index.d.ts" ] } From d18bbdbe88ad5216f308e47b9069d2e901c452aa Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sun, 5 May 2024 20:43:03 +0200 Subject: [PATCH 4/8] removes safe-buffer (not needed anymore) (#87) --- package.json | 3 +-- src/index.d.ts | 2 -- src/mocompiler.js | 1 - src/pocompiler.js | 1 - 4 files changed, 1 insertion(+), 6 deletions(-) diff --git a/package.json b/package.json index d279a33..e0115d5 100644 --- a/package.json +++ b/package.json @@ -31,8 +31,7 @@ "dependencies": { "content-type": "^1.0.5", "encoding": "^0.1.13", - "readable-stream": "^4.5.2", - "safe-buffer": "^5.2.1" + "readable-stream": "^4.5.2" }, "devDependencies": { "@types/chai": "latest", diff --git a/src/index.d.ts b/src/index.d.ts index d47b72b..8adf7ea 100644 --- a/src/index.d.ts +++ b/src/index.d.ts @@ -1,7 +1,5 @@ import { Transform } from "readable-stream"; -import {Buffer} from "safe-buffer"; - export declare module 'encoding' { export function convert(buf: Buffer, toCharset: string, fromCharset: string): Buffer; } diff --git a/src/mocompiler.js b/src/mocompiler.js index 9e8747d..229904d 100644 --- a/src/mocompiler.js +++ b/src/mocompiler.js @@ -1,4 +1,3 @@ -import { Buffer } from 'safe-buffer'; import encoding from 'encoding'; import { HEADERS, formatCharset, generateHeader, compareMsgid } from './shared.js'; import contentType from 'content-type'; diff --git a/src/pocompiler.js b/src/pocompiler.js index c08671b..024492c 100644 --- a/src/pocompiler.js +++ b/src/pocompiler.js @@ -1,4 +1,3 @@ -import { Buffer } from 'safe-buffer'; import encoding from 'encoding'; import { HEADERS, foldLine, compareMsgid, formatCharset, generateHeader } from './shared.js'; import contentType from 'content-type'; From 2f94ed77bb4eca871fc435a85ce2fecbb8240447 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sun, 5 May 2024 20:58:57 +0200 Subject: [PATCH 5/8] speed up lexer parsing (#88) * speed up lexer parsing --- src/poparser.js | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/src/poparser.js b/src/poparser.js index a9803e1..981dcca 100644 --- a/src/poparser.js +++ b/src/poparser.js @@ -121,8 +121,6 @@ Parser.prototype.types = { * String matches for lexer */ Parser.prototype.symbols = { - quotes: /["']/, - comments: /#/, whitespace: /\s/, key: /[\w\-[\]]/, keyNames: /^(?:msgctxt|msgid(?:_plural)?|msgstr(?:\[\d+])?)$/ @@ -146,7 +144,7 @@ Parser.prototype._lexer = function (chunk) { switch (this._state) { case this.states.none: case this.states.obsolete: - if (chr.match(this.symbols.quotes)) { + if (chr === '"' || chr === "'") { this._node = { type: this.types.string, value: '', @@ -154,7 +152,7 @@ Parser.prototype._lexer = function (chunk) { }; this._lex.push(this._node); this._state = this.states.string; - } else if (chr.match(this.symbols.comments)) { + } else if (chr === "#") { this._node = { type: this.types.comments, value: '' From 955eaa25aa0cb3e117fdf0742d66bcc6afeb3601 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Mon, 6 May 2024 00:48:49 +0200 Subject: [PATCH 6/8] fixes missing replacements for deprecated code (#90) - scripts - make sure that all is ready before fire the script --- package.json | 2 +- src/poparser.js | 4 ++-- src/shared.js | 4 ++-- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/package.json b/package.json index e0115d5..b259f4b 100644 --- a/package.json +++ b/package.json @@ -23,7 +23,7 @@ "test": "mocha", "preversion": "npm run lint && npm test", "postversion": "git push && git push --tags", - "prepublish": "tsc && npm run lint && npm run test" + "prepublishOnly": "npm i && tsc && npm run lint && npm run test" }, "main": "./lib/index.js", "types": "./lib/index.d.ts", diff --git a/src/poparser.js b/src/poparser.js index 981dcca..5ea9030 100644 --- a/src/poparser.js +++ b/src/poparser.js @@ -579,9 +579,9 @@ PoParserTransform.prototype._transform = function (chunk, encoding, done) { } // it seems we found some 8bit bytes from the end of the string, so let's cache these if (len) { - this._cache = [chunk.slice(chunk.length - len)]; + this._cache = [chunk.subarray(chunk.length - len)]; this._cacheSize = this._cache[0].length; - chunk = chunk.slice(0, chunk.length - len); + chunk = chunk.subarray(0, chunk.length - len); } // chunk might be empty if it only continued of 8bit bytes and these were all cached diff --git a/src/shared.js b/src/shared.js index 5e2d3a5..459858b 100644 --- a/src/shared.js +++ b/src/shared.js @@ -111,11 +111,11 @@ export function foldLine (str, maxLen = 76) { let match; while (pos < len) { - curLine = str.substr(pos, maxLen); + curLine = str.substring(pos, pos + maxLen); // ensure that the line never ends with a partial escaping // make longer lines if needed - while (curLine.substr(-1) === '\\' && pos + curLine.length < len) { + while (curLine.substring(-1) === '\\' && pos + curLine.length < len) { curLine += str.charAt(pos + curLine.length); } From c40a44c4cb6071444ef74f4de79f353c83d04992 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sun, 12 May 2024 21:02:46 +0200 Subject: [PATCH 7/8] fix missing types and jsDocs (#89) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * fix missing types and jsDocs * removing definition file, the definitions were moved to the type.js file * enhanced type for pocompiler and postream * enhancing js docs types * jsdocs types (still few error to solve) * @johnhooks review suggestions Co-authored-by: John Hooks * apply suggestion by johnhooks Co-authored-by: John Hooks * apply @johnhooks suggestions 🙌 * wip types * fixed types * allows tsc to fail in ci tests * fix: adjust typing of the parsers and compilers This commit adds missing types and attempts fix type errors. There are still a few type errors, though how to fix them is not clear. Adds the `Translations` type for the `translations` property of the `GetTextTranslations` type. * add imports for types * add encoding declaration * add types directory to tsconfig include * remove types directory from .gitignore --------- Co-authored-by: John Hooks --- .eslintrc.json | 3 +- .github/workflows/ci.yml | 17 ++- package.json | 2 - src/index.d.ts | 52 --------- src/index.js | 12 +- src/mocompiler.js | 142 +++++++++++++++-------- src/moparser.js | 122 +++++++++++--------- src/pocompiler.js | 212 ++++++++++++++++++++-------------- src/poparser.js | 237 ++++++++++++++++++++++++-------------- src/shared.js | 49 +++++--- src/types.js | 52 +++++++++ tsconfig.json | 26 ++--- types/encoding/index.d.ts | 3 + 13 files changed, 554 insertions(+), 375 deletions(-) delete mode 100644 src/index.d.ts create mode 100644 src/types.js create mode 100644 types/encoding/index.d.ts diff --git a/.eslintrc.json b/.eslintrc.json index bcfae6d..30149ce 100644 --- a/.eslintrc.json +++ b/.eslintrc.json @@ -3,8 +3,7 @@ "es2021": true, "node": true }, - "extends": ["eslint:recommended", "plugin:@typescript-eslint/recommended"], - "parser": "@typescript-eslint/parser", + "extends": "standard", "parserOptions": { "ecmaVersion": "latest", "sourceType": "module" diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index a9056d3..d9de309 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -3,15 +3,24 @@ on: - push - pull_request jobs: + build: + name: Build with tsc + runs-on: ubuntu-latest + continue-on-error: true + steps: + - uses: actions/checkout@v4 + - uses: actions/setup-node@v4 + with: + node-version: lts/* + - run: npm install + - run: npx tsc test: - name: Node.js ${{ matrix.node-version }} on ${{ matrix.os }} + name: Test ${{ matrix.node-version }} on ${{ matrix.os }} runs-on: ${{ matrix.os }} strategy: fail-fast: false matrix: - node-version: - - 18 - - 20 + node: [ 18, 20 ] os: - ubuntu-latest - windows-latest diff --git a/package.json b/package.json index b259f4b..69f7b0d 100644 --- a/package.json +++ b/package.json @@ -38,8 +38,6 @@ "@types/content-type": "^1.1.8", "@types/mocha": "latest", "@types/readable-stream": "^4.0.11", - "@typescript-eslint/eslint-plugin": "^6.18.1", - "@typescript-eslint/parser": "^6.14.0", "chai": "^5.0.3", "eslint": "^8.56.0", "eslint-config-standard": "^17.1.0", diff --git a/src/index.d.ts b/src/index.d.ts deleted file mode 100644 index 8adf7ea..0000000 --- a/src/index.d.ts +++ /dev/null @@ -1,52 +0,0 @@ -import { Transform } from "readable-stream"; - -export declare module 'encoding' { - export function convert(buf: Buffer, toCharset: string, fromCharset: string): Buffer; -} - -export interface Compiler { - _table: GetTextTranslations; - compile(): Buffer; -} - -export interface GetTextComment { - translator?: string; - reference?: string; - extracted?: string; - flag?: string; - previous?: string; -} - -export interface GetTextTranslation { - msgctxt?: string; - msgid: string; - msgid_plural?: string; - msgstr: string[]; - comments?: GetTextComment; -} - -export interface GetTextTranslations { - charset: string; - headers: { [headerName: string]: string }; - translations: { [msgctxt: string]: { [msgId: string]: GetTextTranslation } }; -} - -export interface parserOptions { - defaultCharset?: string; - validation?: boolean; -} - -export interface po { - parse: (buffer: Buffer | string, defaultCharset?: string) => GetTextTranslations; - compile: (table: GetTextTranslations, options?: parserOptions) => Buffer; - createParseStream: (options?: parserOptions, transformOptions?: import('readable-stream').TransformOptions) => Transform; -} - -export interface mo { - parse: (buffer: Buffer | string, defaultCharset?: string) => GetTextTranslations; - compile: (table: GetTextTranslations, options?: parserOptions) => Buffer; -} - -export * from "./@types"; - -export default { po, mo } as { po: po, mo: mo }; diff --git a/src/index.js b/src/index.js index 05e32a3..fe34104 100644 --- a/src/index.js +++ b/src/index.js @@ -1,4 +1,4 @@ -import * as poParser from './poparser.js'; +import { poParse, poStream } from './poparser.js'; import poCompiler from './pocompiler.js'; import moParser from './moparser.js'; import moCompiler from './mocompiler.js'; @@ -6,20 +6,16 @@ import moCompiler from './mocompiler.js'; /** * Translation parser and compiler for PO files * @see https://www.gnu.org/software/gettext/manual/html_node/PO.html - * - * @type {import("./index.d.ts").po} po */ export const po = { - parse: poParser.parse, - createParseStream: poParser.stream, + parse: poParse, + createParseStream: poStream, compile: poCompiler }; /** - * Translation parser and compiler for PO files + * Translation parser and compiler for MO files * @see https://www.gnu.org/software/gettext/manual/html_node/MO.html - * - * @type {import("./index.d.ts").mo} mo */ export const mo = { parse: moParser, diff --git a/src/mocompiler.js b/src/mocompiler.js index 229904d..f538a6d 100644 --- a/src/mocompiler.js +++ b/src/mocompiler.js @@ -2,11 +2,30 @@ import encoding from 'encoding'; import { HEADERS, formatCharset, generateHeader, compareMsgid } from './shared.js'; import contentType from 'content-type'; +/** + * @typedef {import('node:stream').Transform} Transform + * @typedef {import('./types.js').GetTextTranslation} GetTextTranslation + * @typedef {import('./types.js').GetTextTranslations} GetTextTranslations + * @typedef {import('./types.js').Translations} Translations + * @typedef {import('./types.js').WriteFunc} WriteFunc + */ + +/** + * @typedef {Object} Size Data about the size of the compiled MO object. + * @property {number} msgid The size of the msgid section. + * @property {number} msgstr The size of the msgstr section. + * @property {number} total The total size of the compiled MO object. + */ + +/** + * @typedef {{ msgid: Buffer, msgstr: Buffer }} TranslationBuffers A translation object partially parsed. + */ + /** * Exposes general compiler function. Takes a translation * object as a parameter and returns binary MO object * - * @param {import('./index.d.ts').GetTextTranslations} table Translation object + * @param {GetTextTranslations} table Translation object * @return {Buffer} Compiled binary MO object */ export default function (table) { @@ -16,66 +35,85 @@ export default function (table) { } /** - * Creates a MO compiler object. - * - * @constructor - * @param {import('./index.d.ts').GetTextTranslations} table Translation table as defined in the README - * @return {import('./index.d.ts').Compiler} Compiler + * Prepare the header object to be compatible with MO compiler + * @param {Record} headers the headers + * @return {Record} The prepared header */ -function Compiler (table = {}) { - this._table = table; - - let { headers = {}, translations = {} } = this._table; - - headers = Object.keys(headers).reduce((result, key) => { +function prepareMoHeaders (headers) { + return Object.keys(headers).reduce((result, key) => { const lowerKey = key.toLowerCase(); if (HEADERS.has(lowerKey)) { // POT-Creation-Date is removed in MO (see https://savannah.gnu.org/bugs/?49654) if (lowerKey !== 'pot-creation-date') { - result[HEADERS.get(lowerKey)] = headers[key]; + const value = HEADERS.get(lowerKey); + if (value) { + result[value] = headers[key]; + } } } else { result[key] = headers[key]; } return result; - }, {}); + }, /** @type {Record} */ ({})); +} - // filter out empty translations - translations = Object.keys(translations).reduce((result, msgctxt) => { +/** + * Prepare the translation object to be compatible with MO compiler + * @param {Translations} translations + * @return {Translations} + */ +function prepareTranslations (translations) { + return Object.keys(translations).reduce((result, msgctxt) => { const context = translations[msgctxt]; const msgs = Object.keys(context).reduce((result, msgid) => { - const hasTranslation = context[msgid].msgstr.some(item => !!item.length); + const TranslationMsgstr = context[msgid].msgstr; + const hasTranslation = TranslationMsgstr.some(item => !!item.length); if (hasTranslation) { result[msgid] = context[msgid]; } return result; - }, {}); + }, /** @type {Record} */({})); if (Object.keys(msgs).length) { result[msgctxt] = msgs; } return result; - }, {}); + }, /** @type {Translations} */({})); +} - this._table.translations = translations; - this._table.headers = headers; +/** + * Creates a MO compiler object. + * @this {Compiler & Transform} + * + * @param {GetTextTranslations} [table] Translation table as defined in the README + */ +function Compiler (table) { + /** @type {GetTextTranslations} _table The translation table */ + this._table = { + charset: undefined, + translations: prepareTranslations(table?.translations ?? {}), + headers: prepareMoHeaders(table?.headers ?? {}) + }; this._translations = []; - + /** + * @type {WriteFunc} + */ this._writeFunc = 'writeUInt32LE'; this._handleCharset(); -} -/** - * Magic bytes for the generated binary data - */ -Compiler.prototype.MAGIC = 0x950412de; + /** + * Magic bytes for the generated binary data + * @type {number} MAGIC file header magic value of mo file + */ + this.MAGIC = 0x950412de; +} /** * Handles header values, replaces or adds (if needed) a charset property @@ -96,17 +134,19 @@ Compiler.prototype._handleCharset = function () { /** * Generates an array of translation strings - * in the form of [{msgid:... , msgstr:...}] + * in the form of [{msgid:..., msgstr: ...}] * - * @return {Array} Translation strings array */ Compiler.prototype._generateList = function () { + /** @type {TranslationBuffers[]} */ const list = []; - list.push({ - msgid: Buffer.alloc(0), - msgstr: encoding.convert(generateHeader(this._table.headers), this._table.charset) - }); + if ('headers' in this._table) { + list.push({ + msgid: Buffer.alloc(0), + msgstr: encoding.convert(generateHeader(this._table.headers), this._table.charset) + }); + } Object.keys(this._table.translations).forEach(msgctxt => { if (typeof this._table.translations[msgctxt] !== 'object') { @@ -133,7 +173,7 @@ Compiler.prototype._generateList = function () { key += '\u0000' + msgidPlural; } - const value = [].concat(this._table.translations[msgctxt][msgid].msgstr || []).join('\u0000'); + const value = /** @type {string[]} */([]).concat(this._table.translations[msgctxt][msgid].msgstr ?? []).join('\u0000'); list.push({ msgid: encoding.convert(key, this._table.charset), @@ -148,20 +188,19 @@ Compiler.prototype._generateList = function () { /** * Calculate buffer size for the final binary object * - * @param {import('./index.d.ts').GetTextTranslations} list An array of translation strings from _generateList - * @return {Object} Size data of {msgid, msgstr, total} + * @param {TranslationBuffers[]} list An array of translation strings from _generateList + * @return {Size} Size data of {msgid, msgstr, total} */ Compiler.prototype._calculateSize = function (list) { let msgidLength = 0; let msgstrLength = 0; - let totalLength = 0; list.forEach(translation => { msgidLength += translation.msgid.length + 1; // + extra 0x00 msgstrLength += translation.msgstr.length + 1; // + extra 0x00 }); - totalLength = 4 + // magic number + const totalLength = 4 + // magic number 4 + // revision 4 + // string count 4 + // original string table offset @@ -183,9 +222,9 @@ Compiler.prototype._calculateSize = function (list) { /** * Generates the binary MO object from the translation list * - * @param {import('./index.d.ts').GetTextTranslations} list translation list - * @param {Object} size Byte size information - * @return {Buffer} Compiled MO object + * @param {TranslationBuffers[]} list translation list + * @param {Size} size Byte size information + * @return {Buffer} Compiled MO object */ Compiler.prototype._build = function (list, size) { const returnBuffer = Buffer.alloc(size.total); @@ -214,21 +253,23 @@ Compiler.prototype._build = function (list, size) { // hash table offset returnBuffer[this._writeFunc](28 + (4 + 4) * list.length * 2, 24); - // build originals table + // Build original table curPosition = 28 + 2 * (4 + 4) * list.length; for (i = 0, len = list.length; i < len; i++) { - list[i].msgid.copy(returnBuffer, curPosition); - returnBuffer[this._writeFunc](list[i].msgid.length, 28 + i * 8); - returnBuffer[this._writeFunc](curPosition, 28 + i * 8 + 4); + const msgidLength = /** @type {Buffer} */(/** @type {unknown} */(list[i].msgid)); + msgidLength.copy(returnBuffer, curPosition); + returnBuffer.writeUInt32LE(list[i].msgid.length, 28 + i * 8); + returnBuffer.writeUInt32LE(curPosition, 28 + i * 8 + 4); returnBuffer[curPosition + list[i].msgid.length] = 0x00; curPosition += list[i].msgid.length + 1; } - // build translations table + // build translation table for (i = 0, len = list.length; i < len; i++) { - list[i].msgstr.copy(returnBuffer, curPosition); - returnBuffer[this._writeFunc](list[i].msgstr.length, 28 + (4 + 4) * list.length + i * 8); - returnBuffer[this._writeFunc](curPosition, 28 + (4 + 4) * list.length + i * 8 + 4); + const msgstrLength = /** @type {Buffer} */(/** @type {unknown} */(list[i].msgstr)); + msgstrLength.copy(returnBuffer, curPosition); + returnBuffer.writeUInt32LE(list[i].msgstr.length, 28 + (4 + 4) * list.length + i * 8); + returnBuffer.writeUInt32LE(curPosition, 28 + (4 + 4) * list.length + i * 8 + 4); returnBuffer[curPosition + list[i].msgstr.length] = 0x00; curPosition += list[i].msgstr.length + 1; } @@ -237,8 +278,9 @@ Compiler.prototype._build = function (list, size) { }; /** - * Compiles translation object into a binary MO object + * Compiles a translation object into a binary MO object * + * @interface * @return {Buffer} Compiled MO object */ Compiler.prototype.compile = function () { diff --git a/src/moparser.js b/src/moparser.js index 43097cf..263efdb 100644 --- a/src/moparser.js +++ b/src/moparser.js @@ -1,12 +1,19 @@ import encoding from 'encoding'; import { formatCharset, parseHeader } from './shared.js'; +/** + * @typedef {import('./types.js').GetTextTranslations} GetTextTranslations + * @typedef {import('./types.js').GetTextTranslation} GetTextTranslation + * @typedef {import('./types.js').Translations} Translations + * @typedef {import('./types.js').WriteFunc} WriteFunc + * @typedef {import('./types.js').ReadFunc} ReadFunc + */ + /** * Parses a binary MO object into translation table * * @param {Buffer} buffer Binary MO object - * @param {String} [defaultCharset] Default charset to use - * @return {Object} Translation object + * @param {string} [defaultCharset] Default charset to use */ export default function (buffer, defaultCharset) { const parser = new Parser(buffer, defaultCharset); @@ -18,48 +25,53 @@ export default function (buffer, defaultCharset) { * Creates a MO parser object. * * @constructor - * @param {Buffer} fileContents Binary MO object - * @param {String} [defaultCharset] Default charset to use + * @param {Buffer|null} fileContents Binary MO object + * @param {string} [defaultCharset] Default charset to use */ function Parser (fileContents, defaultCharset = 'iso-8859-1') { this._fileContents = fileContents; + this._charset = defaultCharset; + /** - * Method name for writing int32 values, default littleendian - */ + * @type {WriteFunc} + */ this._writeFunc = 'writeUInt32LE'; /** - * Method name for reading int32 values, default littleendian - */ + * @type {ReadFunc} + */ this._readFunc = 'readUInt32LE'; - this._charset = defaultCharset; - + /** + * Translation table + * + * @type {GetTextTranslations} table Translation object + */ this._table = { charset: this._charset, - headers: undefined, + headers: {}, translations: {} }; -} -/** - * Magic constant to check the endianness of the input file - */ -Parser.prototype.MAGIC = 0x950412de; + /** + * Magic constant to check the endianness of the input file + */ + this.MAGIC = 0x950412de; +} /** - * Checks if number values in the input file are in big- or littleendian format. + * Checks if number values in the input file are in big- or little endian format. * - * @return {Boolean} Return true if magic was detected + * @return {boolean} Return true if magic was detected */ Parser.prototype._checkMagick = function () { - if (this._fileContents.readUInt32LE(0) === this.MAGIC) { + if (this._fileContents?.readUInt32LE(0) === this.MAGIC) { this._readFunc = 'readUInt32LE'; this._writeFunc = 'writeUInt32LE'; return true; - } else if (this._fileContents.readUInt32BE(0) === this.MAGIC) { + } else if (this._fileContents?.readUInt32BE(0) === this.MAGIC) { this._readFunc = 'readUInt32BE'; this._writeFunc = 'writeUInt32BE'; @@ -70,18 +82,23 @@ Parser.prototype._checkMagick = function () { }; /** - * Read the original strings and translations from the input MO file. Use the - * first translation string in the file as the header. + * Read the original strings and translations from the input MO file. + * Use the first translation string in the file as the header. */ Parser.prototype._loadTranslationTable = function () { - let offsetOriginals = this._offsetOriginals; - let offsetTranslations = this._offsetTranslations; + let offsetOriginals = this._offsetOriginals || 0; + let offsetTranslations = this._offsetTranslations || 0; let position; let length; let msgid; let msgstr; + // Return if there are no translations + if (!this._total) { this._fileContents = null; return; } + + // Loop through all strings in the MO file for (let i = 0; i < this._total; i++) { + if (this._fileContents === null) continue; // msgid string length = this._fileContents[this._readFunc](offsetOriginals); offsetOriginals += 4; @@ -89,7 +106,7 @@ Parser.prototype._loadTranslationTable = function () { offsetOriginals += 4; msgid = this._fileContents.subarray( position, - position + length, + position + length ); // matching msgstr @@ -99,7 +116,7 @@ Parser.prototype._loadTranslationTable = function () { offsetTranslations += 4; msgstr = this._fileContents.subarray( position, - position + length, + position + length ); if (!i && !msgid.toString()) { @@ -131,34 +148,31 @@ Parser.prototype._handleCharset = function (headers) { this._charset = this._table.charset = formatCharset(match[1], this._charset); } - headers = encoding.convert(headers, 'utf-8', this._charset) - .toString('utf8'); + headers = encoding.convert(headers, 'utf-8', this._charset); - this._table.headers = parseHeader(headers); + this._table.headers = parseHeader(headers.toString('utf8')); }; /** * Adds a translation to the translation object * - * @param {String} msgid Original string - * @params {String} msgstr Translation for the original string + * @param {string} msgidRaw Original string + * @param {string} msgstrRaw Translation for the original string */ -Parser.prototype._addString = function (msgid, msgstr) { +Parser.prototype._addString = function (msgidRaw, msgstrRaw) { const translation = {}; - let msgctxt; + let msgctxt = ''; let msgidPlural; - msgid = msgid.split('\u0004'); - if (msgid.length > 1) { - msgctxt = msgid.shift(); + const msgidArray = msgidRaw.split('\u0004'); + if (msgidArray.length > 1) { + msgctxt = msgidArray.shift() || ''; translation.msgctxt = msgctxt; - } else { - msgctxt = ''; } - msgid = msgid.join('\u0004'); + msgidRaw = msgidArray.join('\u0004'); - const parts = msgid.split('\u0000'); - msgid = parts.shift(); + const parts = msgidRaw.split('\u0000'); + const msgid = parts.shift() || ''; translation.msgid = msgid; @@ -166,8 +180,8 @@ Parser.prototype._addString = function (msgid, msgstr) { translation.msgid_plural = msgidPlural; } - msgstr = msgstr.split('\u0000'); - translation.msgstr = [].concat(msgstr || []); + const msgstr = msgstrRaw.split('\u0000'); + translation.msgstr = [...msgstr]; if (!this._table.translations[msgctxt]) { this._table.translations[msgctxt] = {}; @@ -179,31 +193,31 @@ Parser.prototype._addString = function (msgid, msgstr) { /** * Parses the MO object and returns translation table * - * @return {Object} Translation table + * @return {GetTextTranslations | false} Translation table */ Parser.prototype.parse = function () { - if (!this._checkMagick()) { + if (!this._checkMagick() || this._fileContents === null) { return false; } /** - * GetText revision nr, usually 0 - */ + * GetText revision nr, usually 0 + */ this._revision = this._fileContents[this._readFunc](4); /** - * Total count of translated strings - */ - this._total = this._fileContents[this._readFunc](8); + * @type {number} Total count of translated strings + */ + this._total = this._fileContents[this._readFunc](8) ?? 0; /** - * Offset position for original strings table - */ + * @type {number} Offset position for original strings table + */ this._offsetOriginals = this._fileContents[this._readFunc](12); /** - * Offset position for translation strings table - */ + * @type {number} Offset position for translation strings table + */ this._offsetTranslations = this._fileContents[this._readFunc](16); // Load translations into this._translationTable diff --git a/src/pocompiler.js b/src/pocompiler.js index 024492c..b107e88 100644 --- a/src/pocompiler.js +++ b/src/pocompiler.js @@ -1,13 +1,27 @@ -import encoding from 'encoding'; import { HEADERS, foldLine, compareMsgid, formatCharset, generateHeader } from './shared.js'; import contentType from 'content-type'; +import encoding from 'encoding'; + +/** + * @typedef {import('./types.js').GetTextTranslations} GetTextTranslations + * @typedef {import('./types.js').GetTextTranslation} GetTextTranslation + * @typedef {import('./types.js').GetTextComment} GetTextComment + * @typedef {import('./types.js').Translations} Translations + * @typedef {import('./types.js').ParserOptions} ParserOptions + */ + +/** + * @typedef {Partial> & { msgstr?: string | string[] }} PreOutputTranslation + */ + /** * Exposes general compiler function. Takes a translation * object as a parameter and returns PO object * - * @param {Object} table Translation object - * @return {Buffer} Compiled PO object + * @param {GetTextTranslations} table Translation object + * @param {ParserOptions} [options] Options + * @return {Buffer} The compiled PO object */ export default function (table, options) { const compiler = new Compiler(table, options); @@ -16,48 +30,52 @@ export default function (table, options) { } /** - * Creates a PO compiler object. + * Takes the header object and converts all headers into the lowercase format * - * @constructor - * @param {Object} table Translation table to be compiled + * @param {Record} headersRaw the headers to prepare + * @returns {Record} the headers in the lowercase format */ -function Compiler (table = {}, options = {}) { - this._table = table; - this._options = options; - - this._table.translations = this._table.translations || {}; - - let { headers = {} } = this._table; - - headers = Object.keys(headers).reduce((result, key) => { +export function preparePoHeaders (headersRaw) { + return Object.keys(headersRaw).reduce((result, key) => { const lowerKey = key.toLowerCase(); + const value = HEADERS.get(lowerKey); - if (HEADERS.has(lowerKey)) { - result[HEADERS.get(lowerKey)] = headers[key]; + if (typeof value === 'string') { + result[value] = headersRaw[key]; } else { - result[key] = headers[key]; + result[key] = headersRaw[key]; } return result; - }, {}); - - this._table.headers = headers; - - if (!('foldLength' in this._options)) { - this._options.foldLength = 76; - } - - if (!('escapeCharacters' in this._options)) { - this._options.escapeCharacters = true; - } - - if (!('sort' in this._options)) { - this._options.sort = false; - } + }, /** @type {Record} */ ({})); +} - if (!('eol' in this._options)) { - this._options.eol = '\n'; - } +/** + * Creates a PO compiler object. + * + * @constructor + * @param {GetTextTranslations} [table] Translation table to be compiled + * @param {ParserOptions} [options] Options + */ +function Compiler (table, options) { + this._table = table ?? { + headers: {}, + charset: undefined, + translations: {} + }; + this._table.translations = { ...this._table.translations }; + + /** @type {ParserOptions} _options The Options object */ + this._options = { + foldLength: 76, + escapeCharacters: true, + sort: false, + eol: '\n', + ...options + }; + + /** @type {Record}} the translation table */ + this._table.headers = preparePoHeaders(this._table.headers ?? {}); this._translations = []; @@ -65,14 +83,16 @@ function Compiler (table = {}, options = {}) { } /** - * Converts a comments object to a comment string. The comment object is - * in the form of {translator:'', reference: '', extracted: '', flag: '', previous:''} + * Converts a comment object to a comment string. The comment object is + * in the form of {translator: '', reference: '', extracted: '', flag: '', previous: ''} * - * @param {Object} comments A comments object - * @return {String} A comment string for the PO file + * @param {Record} comments A comments object + * @return {string} A comment string for the PO file */ Compiler.prototype._drawComments = function (comments) { + /** @var {Record[]} lines The comment lines to be returned */ const lines = []; + /** @var {{key: GetTextComment, prefix: string}} type The comment type */ const types = [{ key: 'translator', prefix: '# ' @@ -90,38 +110,47 @@ Compiler.prototype._drawComments = function (comments) { prefix: '#| ' }]; - types.forEach(type => { - if (!comments[type.key]) { - return; - } + for (const type of types) { + /** @var {string} value The comment type */ + const value = type.key; + + // ignore empty comments + if (!(value in comments)) { continue; } + + const commentLines = comments[value].split(/\r?\n|\r/); - comments[type.key].split(/\r?\n|\r/).forEach(line => { + // add comment lines to comments Array + for (const line of commentLines) { lines.push(`${type.prefix}${line}`); - }); - }); + } + } - return lines.join(this._options.eol); + return lines.length ? lines.join(this._options.eol) : ''; }; /** * Builds a PO string for a single translation object * - * @param {Object} block Translation object - * @param {Object} [override] Properties of this object will override `block` properties + * @param {PreOutputTranslation} block Translation object + * @param {Partial} [override] Properties of this object will override `block` properties * @param {boolean} [obsolete] Block is obsolete and must be commented out - * @return {String} Translation string for a single object + * @return {string} Translation string for a single object */ Compiler.prototype._drawBlock = function (block, override = {}, obsolete = false) { const response = []; const msgctxt = override.msgctxt || block.msgctxt; const msgid = override.msgid || block.msgid; const msgidPlural = override.msgid_plural || block.msgid_plural; - const msgstr = [].concat(override.msgstr || block.msgstr); - let comments = override.comments || block.comments; - - // add comments - if (comments && (comments = this._drawComments(comments))) { - response.push(comments); + const msgstrData = override.msgstr || block.msgstr; + const msgstr = Array.isArray(msgstrData) ? [...msgstrData] : [msgstrData]; + + /** @type {GetTextComment|undefined} */ + const comments = override.comments || block.comments; + if (comments) { + const drawnComments = this._drawComments(comments); + if (drawnComments) { + response.push(drawnComments); + } } if (msgctxt) { @@ -146,10 +175,10 @@ Compiler.prototype._drawBlock = function (block, override = {}, obsolete = false /** * Escapes and joins a key and a value for the PO string * - * @param {String} key Key name - * @param {String} value Key value + * @param {string} key Key name + * @param {string} value Key value * @param {boolean} [obsolete] PO string is obsolete and must be commented out - * @return {String} Joined and escaped key-value pair + * @return {string} Joined and escaped key-value pair */ Compiler.prototype._addPOString = function (key = '', value = '', obsolete = false) { key = key.toString(); @@ -176,7 +205,7 @@ Compiler.prototype._addPOString = function (key = '', value = '', obsolete = fal eol = eol + '#~ '; } - if (foldLength > 0) { + if (foldLength && foldLength > 0) { lines = foldLine(value, foldLength); } else { // split only on new lines @@ -202,49 +231,52 @@ Compiler.prototype._addPOString = function (key = '', value = '', obsolete = fal * Handles header values, replaces or adds (if needed) a charset property */ Compiler.prototype._handleCharset = function () { - const ct = contentType.parse(this._table.headers['Content-Type'] || 'text/plain'); + if (this._table.headers) { + const ct = contentType.parse(this._table.headers['Content-Type'] || 'text/plain'); - const charset = formatCharset(this._table.charset || ct.parameters.charset || 'utf-8'); + const charset = formatCharset(this._table.charset || ct.parameters.charset || 'utf-8'); - // clean up content-type charset independently using fallback if missing - if (ct.parameters.charset) { - ct.parameters.charset = formatCharset(ct.parameters.charset); - } + // clean up content-type charset independently using fallback if missing + if (ct.parameters.charset) { + ct.parameters.charset = formatCharset(ct.parameters.charset); + } - this._table.charset = charset; - this._table.headers['Content-Type'] = contentType.format(ct); + this._table.charset = charset; + this._table.headers['Content-Type'] = contentType.format(ct); + } }; /** * Flatten and sort translations object * - * @param {Object} section Object to be prepared (translations or obsolete) - * @returns {Array} Prepared array + * @param {Translations} section Object to be prepared (translations or obsolete) + * @returns {PreOutputTranslation[]|undefined} Prepared array */ Compiler.prototype._prepareSection = function (section) { + /** @type {GetTextTranslation[]} response Prepared array */ let response = []; - Object.keys(section).forEach(msgctxt => { + for (const msgctxt in section) { if (typeof section[msgctxt] !== 'object') { return; } - Object.keys(section[msgctxt]).forEach(msgid => { + for (const msgid of Object.keys(section[msgctxt])) { if (typeof section[msgctxt][msgid] !== 'object') { - return; + continue; } if (msgctxt === '' && msgid === '') { - return; + continue; } response.push(section[msgctxt][msgid]); - }); - }); + } + } const { sort } = this._options; - if (sort !== false) { + if (sort) { if (typeof sort === 'function') { response = response.sort(sort); } else { @@ -256,33 +288,37 @@ Compiler.prototype._prepareSection = function (section) { }; /** - * Compiles translation object into a PO object + * Compiles a translation object into a PO object * - * @return {Buffer} Compiled PO object + * @interface + * @return {Buffer} Compiled a PO object */ Compiler.prototype.compile = function () { + if (!this._table.translations) { + throw new Error('No translations found'); + } + /** @type {PreOutputTranslation} headerBlock */ const headerBlock = (this._table.translations[''] && this._table.translations['']['']) || {}; - let response = []; const translations = this._prepareSection(this._table.translations); - response = translations.map(r => this._drawBlock(r)); + let response = /** @type {(PreOutputTranslation|string)[]} */ (/** @type {unknown[]} */ (translations?.map(t => this._drawBlock(t)))); if (typeof this._table.obsolete === 'object') { const obsolete = this._prepareSection(this._table.obsolete); - if (obsolete.length) { - response = response.concat(obsolete.map(r => this._drawBlock(r, {}, true))); + if (obsolete && obsolete.length) { + response = response?.concat(obsolete.map(r => this._drawBlock(r, {}, true))); } } - const { eol } = this._options; + const eol = this._options.eol ?? '\n'; - response.unshift(this._drawBlock(headerBlock, { + response?.unshift(this._drawBlock(headerBlock, { msgstr: generateHeader(this._table.headers) })); if (this._table.charset === 'utf-8' || this._table.charset === 'ascii') { - return Buffer.from(response.join(eol + eol) + eol, 'utf-8'); + return Buffer.from(response?.join(eol + eol) + eol, 'utf-8'); } - return encoding.convert(response.join(eol + eol) + eol, this._table.charset); + return encoding.convert(response?.join(eol + eol) + eol, this._table.charset); }; diff --git a/src/poparser.js b/src/poparser.js index 5ea9030..3d209b7 100644 --- a/src/poparser.js +++ b/src/poparser.js @@ -1,16 +1,43 @@ import encoding from 'encoding'; -import { formatCharset, parseNPluralFromHeadersSafely, parseHeader } from './shared.js'; +import { formatCharset, parseHeader, parseNPluralFromHeadersSafely, ParserError } from './shared.js'; import { Transform } from 'readable-stream'; import util from 'util'; +/** + * @typedef {import('stream').Stream.Writable} WritableState + * @typedef {import('readable-stream').TransformOptions} TransformOptions + * @typedef {import('./types.js').GetTextTranslations} GetTextTranslations + * @typedef {import('./types.js').GetTextTranslation} GetTextTranslation + * @typedef {import('./types.js').GetTextComment} GetTextComment + * @typedef {import('./types.js').Translations} Translations + * @typedef {import('./types.js').ParserOptions} ParserOptions + */ + +/** + * @typedef {{ defaultCharset?: string, validation?: boolean }} Options Po parser options + */ + +/** + * @typedef {(...args: any[]) => void} DoneCallback + */ + +/** + * @typedef {Object} Node A single Node object in the PO file + * @property {string} [key] + * @property {number} [type] + * @property {string} value + * @property {string} [quote] + * @property {boolean} [obsolete] + * @property {GetTextComment | undefined} [comments] + */ + /** * Parses a PO object into translation table * - * @typedef {{ defaultCharset?: string, validation?: boolean }} Options * @param {string | Buffer} input PO object * @param {Options} [options] Optional options with defaultCharset and validation */ -export function parse (input, options = {}) { +export function poParse (input, options = {}) { const parser = new Parser(input, options); return parser.parse(); @@ -19,20 +46,17 @@ export function parse (input, options = {}) { /** * Parses a PO stream, emits translation table in object mode * - * @typedef {{ defaultCharset: string, validation: boolean }} Options * @param {Options} [options] Optional options with defaultCharset and validation - * @param {import('readable-stream').TransformOptions} [transformOptions] Optional stream options + * @param {TransformOptions} [transformOptions] Optional stream options */ -export function stream (options = {}, transformOptions = {}) { +export function poStream (options = {}, transformOptions = {}) { return new PoParserTransform(options, transformOptions); } /** - * Creates a PO parser object. If PO object is a string, - * UTF-8 will be used as the charset + * Creates a PO parser object. + * If a PO object is a string, UTF-8 will be used as the charset * - * @typedef {{ defaultCharset?: string, validation?: boolean }} Options - * @constructor * @param {string | Buffer} fileContents PO object * @param {Options} options Options with defaultCharset and validation */ @@ -40,8 +64,10 @@ function Parser (fileContents, { defaultCharset = 'iso-8859-1', validation = fal this._validation = validation; this._charset = defaultCharset; + /** @type {Node[]} Lexed tokens */ this._lex = []; this._escaped = false; + /** @type {Partial} */ this._node = {}; this._state = this.states.none; this._lineNumber = 1; @@ -68,9 +94,10 @@ Parser.prototype.parse = function () { /** * Detects charset for PO strings from the header * - * @param {Buffer} headers Header value + * @param {string | Buffer} buf Header value */ Parser.prototype._handleCharset = function (buf = '') { + /** @type {string} */ const str = buf.toString(); let pos; let headers = ''; @@ -92,6 +119,11 @@ Parser.prototype._handleCharset = function (buf = '') { return this._toString(buf); }; +/** + * Converts buffer to string + * @param {string | Buffer} buf Buffer to convert + * @return {string} Converted string + */ Parser.prototype._toString = function (buf) { return encoding.convert(buf, 'utf-8', this._charset).toString('utf-8'); }; @@ -125,11 +157,11 @@ Parser.prototype.symbols = { key: /[\w\-[\]]/, keyNames: /^(?:msgctxt|msgid(?:_plural)?|msgstr(?:\[\d+])?)$/ }; - /** * Token parser. Parsed state can be found from this._lex * - * @param {String} chunk String + * @param {string} chunk String + * @throws {ParserError} Throws a SyntaxError if the value doesn't match the key names. */ Parser.prototype._lexer = function (chunk) { let chr; @@ -150,14 +182,14 @@ Parser.prototype._lexer = function (chunk) { value: '', quote: chr }; - this._lex.push(this._node); + this._lex.push(/** @type {Node} */ (this._node)); this._state = this.states.string; - } else if (chr === "#") { + } else if (chr === '#') { this._node = { type: this.types.comments, value: '' }; - this._lex.push(this._node); + this._lex.push(/** @type {Node} */ (this._node)); this._state = this.states.comments; } else if (!chr.match(this.symbols.whitespace)) { this._node = { @@ -167,7 +199,7 @@ Parser.prototype._lexer = function (chunk) { if (this._state === this.states.obsolete) { this._node.obsolete = true; } - this._lex.push(this._node); + this._lex.push(/** @type {Node} */ (this._node)); this._state = this.states.key; } break; @@ -211,12 +243,8 @@ Parser.prototype._lexer = function (chunk) { break; case this.states.key: if (!chr.match(this.symbols.key)) { - if (!this._node.value.match(this.symbols.keyNames)) { - const err = new SyntaxError(`Error parsing PO data: Invalid key name "${this._node.value}" at line ${this._lineNumber}. This can be caused by an unescaped quote character in a msgid or msgstr value.`); - - err.lineNumber = this._lineNumber; - - throw err; + if (!this._node.value?.match(this.symbols.keyNames)) { + throw new ParserError(`Error parsing PO data: Invalid key name "${this._node.value}" at line ${this._lineNumber}. This can be caused by an unescaped quote character in a msgid or msgstr value.`, this._lineNumber); } this._state = this.states.none; i--; @@ -231,16 +259,17 @@ Parser.prototype._lexer = function (chunk) { /** * Join multi line strings * - * @param {Object} tokens Parsed tokens - * @return {Object} Parsed tokens, with multi line strings joined into one + * @param {Node[]} tokens Parsed tokens + * @return {Node[]} Parsed tokens, with multi line strings joined into one */ Parser.prototype._joinStringValues = function (tokens) { + /** @type {Node[]} */ const response = []; let lastNode; for (let i = 0, len = tokens.length; i < len; i++) { if (lastNode && tokens[i].type === this.types.string && lastNode.type === this.types.string) { - lastNode.value += tokens[i].value; + lastNode.value += tokens[i].value ?? ''; } else if (lastNode && tokens[i].type === this.types.comments && lastNode.type === this.types.comments) { lastNode.value += '\n' + tokens[i].value; } else { @@ -255,15 +284,17 @@ Parser.prototype._joinStringValues = function (tokens) { /** * Parse comments into separate comment blocks * - * @param {Object} tokens Parsed tokens + * @param {Node[]} tokens Parsed tokens */ Parser.prototype._parseComments = function (tokens) { - // parse comments - tokens.forEach(node => { + for (const node of tokens) { if (!node || node.type !== this.types.comments) { - return; + continue; } + /** @type {{ + [key: string]: string[]; + }} */ const comment = { translator: [], extracted: [], @@ -272,9 +303,10 @@ Parser.prototype._parseComments = function (tokens) { previous: [] }; + /** @type {string[]} */ const lines = (node.value || '').split(/\n/); - lines.forEach(line => { + for (const line of lines) { switch (line.charAt(0) || '') { case ':': comment.reference.push(line.substring(1).trim()); @@ -293,27 +325,31 @@ Parser.prototype._parseComments = function (tokens) { default: comment.translator.push(line.replace(/^\s+/, '')); } - }); + } - node.value = {}; + const finalToken = /** @type {Omit & { value: Record}} */ (/** @type {unknown} */ (node)); - Object.keys(comment).forEach(key => { - if (comment[key] && comment[key].length) { - node.value[key] = comment[key].join('\n'); + finalToken.value = {}; + + for (const key of Object.keys(comment)) { + if (key && comment[key]?.length) { + finalToken.value[key] = comment[key].join('\n'); } - }); - }); + } + } }; /** * Join gettext keys with values * - * @param {Object} tokens Parsed tokens - * @return {Object} Tokens + * @param {(Node & { value?: string })[]} tokens - Parsed tokens containing key-value pairs + * @return {Node[]} - An array of Nodes representing joined tokens */ Parser.prototype._handleKeys = function (tokens) { + /** @type {Node[]} */ const response = []; - let lastNode; + /** @type {Partial & { comments?: string }} */ + let lastNode = {}; for (let i = 0, len = tokens.length; i < len; i++) { if (tokens[i].type === this.types.key) { @@ -327,7 +363,7 @@ Parser.prototype._handleKeys = function (tokens) { lastNode.comments = tokens[i - 1].value; } lastNode.value = ''; - response.push(lastNode); + response.push(/** @type {Node} */ (lastNode)); } else if (tokens[i].type === this.types.string && lastNode) { lastNode.value += tokens[i].value; } @@ -339,22 +375,28 @@ Parser.prototype._handleKeys = function (tokens) { /** * Separate different values into individual translation objects * - * @param {Object} tokens Parsed tokens - * @return {Object} Tokens + * @param {Node[]} tokens Parsed tokens + * @return {GetTextTranslation[]} Tokens */ Parser.prototype._handleValues = function (tokens) { const response = []; - let lastNode; + /** @type {GetTextTranslation} Translation object */ + let lastNode = {}; + /** @type {string | undefined} */ let curContext; + /** @type {GetTextComment | undefined} */ let curComments; for (let i = 0, len = tokens.length; i < len; i++) { - if (tokens[i].key.toLowerCase() === 'msgctxt') { + const tokenKey = tokens[i].key; + if (!tokenKey) continue; + if (tokenKey.toLowerCase() === 'msgctxt') { curContext = tokens[i].value; curComments = tokens[i].comments; - } else if (tokens[i].key.toLowerCase() === 'msgid') { + } else if (tokenKey.toLowerCase() === 'msgid') { lastNode = { - msgid: tokens[i].value + msgid: tokens[i].value, + msgstr: [] }; if (tokens[i].obsolete) { lastNode.obsolete = true; @@ -372,10 +414,10 @@ Parser.prototype._handleValues = function (tokens) { lastNode.comments = tokens[i].comments; } - curContext = false; - curComments = false; + curContext = undefined; + curComments = undefined; response.push(lastNode); - } else if (tokens[i].key.toLowerCase() === 'msgid_plural') { + } else if (tokenKey.toLowerCase() === 'msgid_plural') { if (lastNode) { if (this._validation && 'msgid_plural' in lastNode) { throw new SyntaxError(`Multiple msgid_plural error: entry "${lastNode.msgid}" in "${lastNode.msgctxt || ''}" context has multiple msgid_plural declarations.`); @@ -388,19 +430,21 @@ Parser.prototype._handleValues = function (tokens) { lastNode.comments = tokens[i].comments; } - curContext = false; - curComments = false; - } else if (tokens[i].key.substring(0, 6).toLowerCase() === 'msgstr') { + curContext = undefined; + curComments = undefined; + } else if (tokenKey.substring(0, 6).toLowerCase() === 'msgstr') { if (lastNode) { - lastNode.msgstr = (lastNode.msgstr || []).concat(tokens[i].value); + const strData = lastNode.msgstr || []; + const tokenValue = tokens[i].value; + lastNode.msgstr = (strData).concat(tokenValue); } if (tokens[i].comments && !lastNode.comments) { lastNode.comments = tokens[i].comments; } - curContext = false; - curComments = false; + curContext = undefined; + curComments = undefined; } } @@ -410,11 +454,11 @@ Parser.prototype._handleValues = function (tokens) { /** * Validate token * - * @param {Object} token Parsed token - * @param {Object} translations Translation table + * @param {GetTextTranslation} token Parsed token + * @param {Translations} translations Translation table * @param {string} msgctxt Message entry context - * @param {number} nplurals Number of epected plural forms - * @throws Will throw an error if token validation fails + * @param {number} nplurals Number of expected plural forms + * @throws {Error} Will throw an error if token validation fails */ Parser.prototype._validateToken = function ( { @@ -426,10 +470,6 @@ Parser.prototype._validateToken = function ( msgctxt, nplurals ) { - if (!this._validation) { - return; - } - if (msgid in translations[msgctxt]) { throw new SyntaxError(`Duplicate msgid error: entry "${msgid}" in "${msgctxt}" context has already been declared.`); // eslint-disable-next-line camelcase @@ -445,20 +485,24 @@ Parser.prototype._validateToken = function ( /** * Compose a translation table from tokens object * - * @param {Object} tokens Parsed tokens - * @return {Object} Translation table + * @param {GetTextTranslation[]} tokens Parsed tokens + * @return {GetTextTranslations} Translation table */ Parser.prototype._normalize = function (tokens) { + /** + * Translation table to be returned + * @type {Omit & Partial> } table + */ const table = { charset: this._charset, headers: undefined, translations: {} }; let nplurals = 1; - let msgctxt; for (let i = 0, len = tokens.length; i < len; i++) { - msgctxt = tokens[i].msgctxt || ''; + /** @type {string} */ + const msgctxt = tokens[i].msgctxt || ''; if (tokens[i].obsolete) { if (!table.obsolete) { @@ -485,58 +529,73 @@ Parser.prototype._normalize = function (tokens) { nplurals = parseNPluralFromHeadersSafely(table.headers, nplurals); } - this._validateToken(tokens[i], table.translations, msgctxt, nplurals); + if (this._validation) { + this._validateToken(tokens[i], table.translations, msgctxt, nplurals); + } - table.translations[msgctxt][tokens[i].msgid] = tokens[i]; + const token = tokens[i]; + table.translations[msgctxt][token.msgid] = token; } - return table; + return /** @type {GetTextTranslations} */ (table); }; /** * Converts parsed tokens to a translation table * - * @param {Object} tokens Parsed tokens - * @returns {Object} Translation table + * @param {Node[]} tokens Parsed tokens + * @returns {GetTextTranslations} Translation table */ Parser.prototype._finalize = function (tokens) { + /** + * Translation table + */ let data = this._joinStringValues(tokens); this._parseComments(data); + // The PO parser gettext keys with values data = this._handleKeys(data); - data = this._handleValues(data); - return this._normalize(data); + // The PO parser individual translation objects + const dataset = this._handleValues(data); + return this._normalize(dataset); }; /** * Creates a transform stream for parsing PO input - * - * @typedef {{ defaultCharset: string, validation: boolean }} Options * @constructor - * @param {Options} options Optional options with defaultCharset and validation - * @param {import('readable-stream').TransformOptions} transformOptions Optional stream options + * @this {PoParserTransform & Transform} + * + * @param {ParserOptions} options Optional options with defaultCharset and validation + * @param {TransformOptions & {initialTreshold?: number;}} transformOptions Optional stream options */ function PoParserTransform (options, transformOptions) { + const { initialTreshold, ..._transformOptions } = transformOptions; this.options = options; + /** @type {Parser|false} */ this._parser = false; this._tokens = {}; + /** @type {Buffer[]} */ this._cache = []; this._cacheSize = 0; this.initialTreshold = transformOptions.initialTreshold || 2 * 1024; - Transform.call(this, transformOptions); + Transform.call(this, _transformOptions); + this._writableState.objectMode = false; this._readableState.objectMode = true; } util.inherits(PoParserTransform, Transform); /** - * Processes a chunk of the input stream - */ + * Processes a chunk of the input stream + * @param {Buffer} chunk Chunk of the input stream + * @param {string} encoding Encoding of the chunk + * @param {DoneCallback} done Callback to call when the chunk is processed + */ PoParserTransform.prototype._transform = function (chunk, encoding, done) { let i; let len = 0; @@ -588,7 +647,7 @@ PoParserTransform.prototype._transform = function (chunk, encoding, done) { if (chunk.length) { try { this._parser._lexer(this._parser._toString(chunk)); - } catch (error) { + } catch (/** @type {any} error */error) { setImmediate(() => { done(error); }); @@ -601,8 +660,10 @@ PoParserTransform.prototype._transform = function (chunk, encoding, done) { }; /** - * Once all input has been processed emit the parsed translation table as an object - */ + * Once all inputs have been processed, emit the parsed translation table as an object + * + * @param {DoneCallback} done Callback to call when the chunk is processed + */ PoParserTransform.prototype._flush = function (done) { let chunk; @@ -614,7 +675,7 @@ PoParserTransform.prototype._flush = function (done) { this._parser = new Parser(chunk, this.options); } - if (chunk) { + if (chunk && this._parser) { try { this._parser._lexer(this._parser._toString(chunk)); } catch (error) { @@ -627,7 +688,7 @@ PoParserTransform.prototype._flush = function (done) { } if (this._parser) { - this.push(this._parser._finalize(this._parser._lex)); + /** @type {any} */ (this).push(this._parser._finalize(this._parser._lex)); } setImmediate(done); diff --git a/src/shared.js b/src/shared.js index 459858b..ae005b7 100644 --- a/src/shared.js +++ b/src/shared.js @@ -1,5 +1,7 @@ // see https://www.gnu.org/software/gettext/manual/html_node/Header-Entry.html +/** @type {string} Header name for "Plural-Forms" */ const PLURAL_FORMS = 'Plural-Forms'; +/** @typedef {Map} Headers Map of header keys to header names */ export const HEADERS = new Map([ ['project-id-version', 'Project-Id-Version'], ['report-msgid-bugs-to', 'Report-Msgid-Bugs-To'], @@ -18,12 +20,14 @@ const PLURAL_FORM_HEADER_NPLURALS_REGEX = /nplurals\s*=\s*(?\d+)/; /** * Parses a header string into an object of key-value pairs * - * @param {String} str Header string - * @return {Object} An object of key-value pairs + * @param {string} str Header string + * @return {Record} An object of key-value pairs */ export function parseHeader (str = '') { - return str.split('\n') - .reduce((headers, line) => { + /** @type {string} Header string */ + return str + .split('\n') + .reduce((/** @type {Record} */ headers, line) => { const parts = line.split(':'); let key = (parts.shift() || '').trim(); @@ -42,7 +46,8 @@ export function parseHeader (str = '') { /** * Attempts to safely parse 'nplurals" value from "Plural-Forms" header * - * @param {Object} [headers = {}] An object with parsed headers + * @param {Record} [headers] An object with parsed headers + * @param {number} fallback Fallback value if "Plural-Forms" header is absent * @returns {number} Parsed result */ export function parseNPluralFromHeadersSafely (headers, fallback = 1) { @@ -62,8 +67,8 @@ export function parseNPluralFromHeadersSafely (headers, fallback = 1) { /** * Joins a header object of key value pairs into a header string * - * @param {Object} header Object of key value pairs - * @return {String} Header string + * @param {Record} header Object of key value pairs + * @return {string} An object of key-value pairs */ export function generateHeader (header = {}) { const keys = Object.keys(header) @@ -82,8 +87,9 @@ export function generateHeader (header = {}) { /** * Normalizes charset name. Converts utf8 to utf-8, WIN1257 to windows-1257 etc. * - * @param {String} charset Charset name - * @return {String} Normalized charset name + * @param {string} charset Charset name + * @param {string} defaultCharset Default charset name, defaults to 'iso-8859-1' + * @return {string} Normalized charset name */ export function formatCharset (charset = 'iso-8859-1', defaultCharset = 'iso-8859-1') { return charset.toString() @@ -99,8 +105,8 @@ export function formatCharset (charset = 'iso-8859-1', defaultCharset = 'iso-885 /** * Folds long lines according to PO format * - * @param {String} str PO formatted string to be folded - * @param {Number} [maxLen=76] Maximum allowed length for folded lines + * @param {string} str PO formatted string to be folded + * @param {number} [maxLen=76] Maximum allowed length for folded lines * @return {string[]} An array of lines */ export function foldLine (str, maxLen = 76) { @@ -125,7 +131,7 @@ export function foldLine (str, maxLen = 76) { curLine = match[0]; } else if (pos + curLine.length < len) { // if we're not at the end - if ((match = /.*\s+/.exec(curLine)) && /[^\s]/.test(match[0])) { + if ((match = /.*\s+/.exec(curLine)) && /\S/.test(match[0])) { // use everything before and including the last white space character (if anything) curLine = match[0]; } else if ((match = /.*[\x21-\x2f0-9\x5b-\x60\x7b-\x7e]+/.exec(curLine)) && /[^\x21-\x2f0-9\x5b-\x60\x7b-\x7e]/.test(match[0])) { @@ -144,8 +150,9 @@ export function foldLine (str, maxLen = 76) { /** * Comparator function for comparing msgid * - * @param {Object} object with msgid prev - * @param {Object} object with msgid next + * @template {Buffer|string} T + * @param {{msgid: T}} left with msgid prev + * @param {{msgid: T}} right with msgid next * @returns {number} comparator index */ export function compareMsgid ({ msgid: left }, { msgid: right }) { @@ -159,3 +166,17 @@ export function compareMsgid ({ msgid: left }, { msgid: right }) { return 0; } + +/** + * Custom SyntaxError subclass that includes the lineNumber property. + */ +export class ParserError extends SyntaxError { + /** + * @param {string} message - Error message. + * @param {number} lineNumber - Line number where the error occurred. + */ + constructor (message, lineNumber) { + super(message); + this.lineNumber = lineNumber; + } +} diff --git a/src/types.js b/src/types.js new file mode 100644 index 0000000..450d778 --- /dev/null +++ b/src/types.js @@ -0,0 +1,52 @@ +/** + * Represents a GetText comment. + * @typedef {Object} GetTextComment + * @property {string} [translator] Translator information. + * @property {string} [reference] Reference information. + * @property {string} [extracted] Extracted comments. + * @property {string} [flag] Flags. + * @property {string} [previous] Previous string. + */ + +/** + * Represents a GetText translation. + * @typedef {Object} GetTextTranslation + * @property {string} [msgctxt] Context of the message. + * @property {string} msgid The singular message ID. + * @property {string} [msgid_plural] The plural message ID. + * @property {string[]} msgstr Array of translated strings. + * @property {GetTextComment} [comments] Comments associated with the translation. + * @property {boolean} [obsolete] Whether the translation is obsolete. + */ + +/** + * @typedef {Record>} Translations The translations index. + */ + +/** + * Represents GetText translations. + * @typedef {Object} GetTextTranslations + * @property {string|undefined} charset Character set. + * @property {Record} headers Headers. + * @property {Translations} [obsolete] Obsolete messages. + * @property {Translations} translations Translations. + */ + +/** + * Options for the parser. + * @typedef {Object} ParserOptions + * @property {string} [defaultCharset] Default character set. + * @property {boolean} [validation] Whether to perform validation. + * @property {number} [foldLength] the fold length. + * @property {boolean} [escapeCharacters] Whether to escape characters. + * @property {boolean} [sort] Whether to sort messages. + * @property {string} [eol] End of line character. + */ + +/** + * @typedef {('writeUInt32LE'|'writeUInt32BE')} WriteFunc Type definition for write functions. + */ + +/** + * @typedef {('readUInt32LE'|'readUInt32BE')} ReadFunc Type definition for read functions. + */ diff --git a/tsconfig.json b/tsconfig.json index 96e5c6b..b82537e 100644 --- a/tsconfig.json +++ b/tsconfig.json @@ -4,34 +4,34 @@ "removeComments": false, "module": "Node16", "moduleResolution": "Node16", - "target": "ES2015", - + "target": "ES2018", + "lib": [ + "ES2018" + ], // Strict mode "strict": true, - // Allow javascript files "allowJs": true, - // Check js files for errors - "checkJs": false, - + "checkJs": true, // the directory sources are in "rootDir": "src", - // Output d.ts files to @types "outDir": "lib", - // Generate d.ts files "declaration": true, - // Minify "pretty": false, - // Skip lib check when compiling - "skipLibCheck": true + "skipLibCheck": true, + // For providing missing package types + "typeRoots": [ + "./types", + "./node_modules/@types" + ], }, "include": [ - "src/**/*.js", - "index.d.ts" + "src/**/*", + "types/**/*" ] } diff --git a/types/encoding/index.d.ts b/types/encoding/index.d.ts new file mode 100644 index 0000000..3150d35 --- /dev/null +++ b/types/encoding/index.d.ts @@ -0,0 +1,3 @@ +declare module 'encoding' { + function convert(buffer: Buffer | string, charset?: string, fromCharset?: string): Buffer; +} From f360d0830da049490f27f89d365ec2bfd6362a70 Mon Sep 17 00:00:00 2001 From: Erik Golinelli Date: Sun, 12 May 2024 21:03:45 +0200 Subject: [PATCH 8/8] Track coverage using C8 (#96) * track coverage using c8 * Fix: tests runs twice --- .github/workflows/ci.yml | 2 +- package.json | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index d9de309..2d240c8 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -30,4 +30,4 @@ jobs: with: node-version: ${{ matrix.node-version }} - run: npm install - - run: npm test + - run: npm run test:coverage diff --git a/package.json b/package.json index 69f7b0d..2bd36fe 100644 --- a/package.json +++ b/package.json @@ -21,6 +21,7 @@ "lint": "eslint src/*.js test/*.js", "test-generate-mo": "msgfmt test/fixtures/latin13.po -o test/fixtures/latin13.mo & msgfmt test/fixtures/utf8.po -o test/fixtures/utf8.mo & msgfmt test/fixtures/obsolete.po -o test/fixtures/obsolete.mo", "test": "mocha", + "test:coverage": "npx c8 --check-coverage npm run test", "preversion": "npm run lint && npm test", "postversion": "git push && git push --tags", "prepublishOnly": "npm i && tsc && npm run lint && npm run test" @@ -44,7 +45,7 @@ "eslint-plugin-import": "^2.29.1", "eslint-plugin-n": "^16.6.2", "eslint-plugin-promise": "^6.1.1", - "mocha": "^10.3.0", + "mocha": "^10.4.0", "typescript": "^5.4.5" }, "keywords": [