Skip to content

Commit

Permalink
Calculate checksum for filters and add a '! Checksum' meta to the fil…
Browse files Browse the repository at this point in the history
…ter list. #76

Squashed commit of the following:

commit a876ffc
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 19:20:40 2024 +0300

    add test for calculateChecksum

commit c7a0b15
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 17:45:29 2024 +0300

    fix indents

commit 3bdaa48
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 17:40:12 2024 +0300

    add test to check checksum value

commit 2e6d05e
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 16:59:09 2024 +0300

    update changelog

commit 44788ec
Merge: efbff9b 82247f9
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 16:56:14 2024 +0300

    Merge branch 'fix/#76_add_checksum' of ssh://bit.int.agrd.dev:7999/adguard-filters/hostlist-compiler into fix/#76_add_checksum

commit efbff9b
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 16:56:09 2024 +0300

    fix jsDoc comments

commit 82247f9
Author: Slava Leleka <[email protected]>
Date:   Fri Dec 13 16:55:45 2024 +0300

    Applied suggestion

commit 4ab778f
Author: jellizaveta <[email protected]>
Date:   Fri Dec 13 16:41:48 2024 +0300

    Calculate checksum for filters and add a '! Checksum' meta to the filter list. #76
  • Loading branch information
jellizaveta committed Dec 18, 2024
1 parent d304c09 commit abe6fa3
Show file tree
Hide file tree
Showing 6 changed files with 133 additions and 13 deletions.
7 changes: 7 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,13 @@ All notable changes to this project will be documented in this file.
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

## Unreleased

### Added

- Calculation of checksum for filters and `! Checksum` string to the filter list meta [#76]

[#76]: https://github.com/AdguardTeam/FiltersCompiler/issues/76

## [1.0.29] - 2024-09-26

Expand Down
16 changes: 8 additions & 8 deletions src/index.d.ts
Original file line number Diff line number Diff line change
@@ -1,12 +1,12 @@
declare module '@adguard/hostlist-compiler' {
export type SourceType = 'adblock' | 'hosts';
export type Transformation =
'RemoveComments' |
'Compress' |
'RemoveModifiers' |
'Validate' |
'Deduplicate' |

export type Transformation =
'RemoveComments' |
'Compress' |
'RemoveModifiers' |
'Validate' |
'Deduplicate' |
'InvertAllow' |
'RemoveEmptyLines' |
'TrimLines' |
Expand Down Expand Up @@ -62,7 +62,7 @@ declare module '@adguard/hostlist-compiler' {
* Compiles a filter list using the specified configuration.
*
* @param {*} configuration - compilation configuration.
See the repo README for the details on it.
* See the repo README for the details on it.
* @returns {Promise<Array<string>>} the array of rules.
*/
declare async function compile(configuration: IConfiguration): Promise<string[]>;
Expand Down
14 changes: 9 additions & 5 deletions src/index.js
Original file line number Diff line number Diff line change
Expand Up @@ -4,17 +4,17 @@ const config = require('./configuration');
const compileSource = require('./compile-source');
const { transform } = require('./transformations/transform');
const packageJson = require('../package.json');
const { calculateChecksum } = require('./utils');

/**
* Prepares list header
*
* @param {*} configuration - compilation configuration.
See the repo README for the details on it.
* See the repo README for the details on it.
* @returns {Array<string>} header lines
*/
function prepareHeader(configuration) {
const lines = [
'!',
`! Title: ${configuration.name}`,
];

Expand Down Expand Up @@ -67,7 +67,7 @@ function prepareSourceHeader(source) {
* Compiles a filter list using the specified configuration.
*
* @param {*} configuration - compilation configuration.
See the repo README for the details on it.
* See the repo README for the details on it.
* @returns {Promise<Array<string>>} the array of rules.
*/
async function compile(configuration) {
Expand Down Expand Up @@ -101,8 +101,12 @@ async function compile(configuration) {

// Now prepend the list header and we're good to go
const header = prepareHeader(configuration);
consola.info(`Final length of the list is ${header.length + finalList.length}`);
return header.concat(finalList);
// Calculate checksum
const checksum = calculateChecksum(header, finalList);
// Concat everything together
const data = ['!', checksum, ...header, ...finalList];
consola.info(`Final length of the list is ${data.length}`);
return data;
}

module.exports = compile;
43 changes: 43 additions & 0 deletions src/utils.js
Original file line number Diff line number Diff line change
@@ -1,7 +1,49 @@
const _ = require('lodash');
const fs = require('fs').promises;
const crypto = require('crypto');
const axios = require('axios');

/**
* Strips specified character from the end of a string.
*
* @param {string} string - The string to strip.
* @param {string} char - The character to strip.
* @returns {string} - The stripped string.
*/
const stripEnd = (str, char) => {
let result = str;
while (result.endsWith(char)) {
result = result.slice(0, -1);
}
return result;
};

/**
* Normalizes data by replacing newlines.
*
* @param {string} message - The message to normalize.
* @returns {string} - The normalized message.
*/
const normalizeData = (message) => {
return message.replace(/\r/g, '').replace(/\n+/g, '\n');
};

/**
* Calculates checksum for the given header and rules.
* See:
* https://adblockplus.org/en/filters#special-comments
* https://hg.adblockplus.org/adblockplus/file/tip/addChecksum.py
*
* @param {Array<string>} header - The header lines.
* @param {Array<string>} rules - The rules lines.
* @returns {string} - The calculated checksum.
*/
const calculateChecksum = (header, rules) => {
const content = normalizeData(header.concat(rules).join('\n'));
const checksum = crypto.createHash('md5').update(content).digest('base64');
return `! Checksum: ${stripEnd(checksum.trim(), '=')}`;
};

function isURL(str) {
try {
// eslint-disable-next-line no-unused-vars
Expand Down Expand Up @@ -169,6 +211,7 @@ class Wildcard {
}

module.exports = {
calculateChecksum,
download,
Wildcard,
splitByDelimiterWithEscapeCharacter,
Expand Down
37 changes: 37 additions & 0 deletions test/index.test.js
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
const nock = require('nock');
const consola = require('consola');
const compile = require('../src/index');
const { calculateChecksum } = require('../src/utils');

describe('Hostlist compiler', () => {
it('compile from multiple sources', async () => {
Expand Down Expand Up @@ -32,6 +33,7 @@ describe('Hostlist compiler', () => {
const list = await compile(configuration);

// assert
expect(list[1].startsWith('! Checksum:')).toBe(true);
expect(list).toContain('||example.org');
expect(list).toContain('||example.com');
expect(list).toContain('! Version: 1.0.0.9');
Expand All @@ -41,4 +43,39 @@ describe('Hostlist compiler', () => {

scope.done();
});

it('calculates checksum correctly', async () => {
// Prepare source
const scope = nock('https://example.org')
.get('/source1.txt')
.reply(200, '||example.org');

// compiler configuration
const configuration = {
name: 'Test filter',
description: 'Checksum test filter',
version: '1.0.0.1',
sources: [
{
name: 'source 1',
source: 'https://example.org/source1.txt',
},
],
};

// compile the final list
const list = await compile(configuration);

// assert
const checksumLine = list[1];
expect(checksumLine.startsWith('! Checksum:')).toBe(true);

const header = list.slice(2, list.indexOf('||example.org'));
const finalList = list.slice(list.indexOf('||example.org'));

const expectedChecksum = calculateChecksum(header, finalList);
expect(checksumLine).toBe(expectedChecksum);

scope.done();
});
});
29 changes: 29 additions & 0 deletions test/utils.test.js
Original file line number Diff line number Diff line change
Expand Up @@ -34,3 +34,32 @@ describe('substringBetween', () => {
expect(substr).toBe(null);
});
});

describe('calculateChecksum', () => {
it('calculates checksum with multiple headers and rules', () => {
const header = ['[Adblock Plus 2.0]', '! Title: Example filter list'];
const rules = ['! Checksum: ', '||example.com^', '||test.com^'];
const expectedChecksum = '! Checksum: h0eMYV8/e57vDmGsYZRhsg';

const checksum = utils.calculateChecksum(header, rules);
expect(checksum).toBe(expectedChecksum);
});

it('calculates checksum with empty rules', () => {
const header = ['[Adblock Plus 2.0]'];
const rules = [];
const expectedChecksum = '! Checksum: 87GLA4VsMnV9PiusIkPkEg';

const checksum = utils.calculateChecksum(header, rules);
expect(checksum).toBe(expectedChecksum);
});

it('calculates checksum with empty header and rules', () => {
const header = [];
const rules = [];
const expectedChecksum = '! Checksum: 1B2M2Y8AsgTpgAmY7PhCfg';

const checksum = utils.calculateChecksum(header, rules);
expect(checksum).toBe(expectedChecksum);
});
});

0 comments on commit abe6fa3

Please sign in to comment.