Skip to content

Commit 6faf50d

Browse files
committed
feat: add optional support for source locations
1 parent 9676edd commit 6faf50d

File tree

3 files changed

+105
-2
lines changed

3 files changed

+105
-2
lines changed

src/index.ts

+42-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
import {Parser, ParserOptions} from 'htmlparser2';
2-
import {Directive, Node, Options, Attributes} from '../types/index.d';
2+
import {Directive, Node, NodeTag, Options, Attributes} from '../types/index.d';
33

44
const defaultOptions: ParserOptions = {
55
lowerCaseTags: false,
@@ -49,6 +49,34 @@ const parser = (html: string, options: Options = {}): Node[] => {
4949
return result;
5050
}
5151

52+
const lastLoc = {
53+
line: 1,
54+
column: 1
55+
};
56+
57+
let lastIndex = 0;
58+
function getLoc(index: number) {
59+
if (index < lastIndex) {
60+
throw new Error('Source indices must be monotonic');
61+
}
62+
63+
while (lastIndex < index) {
64+
if (html.charCodeAt(lastIndex) === /* \n */ 10) {
65+
lastLoc.line++;
66+
lastLoc.column = 1;
67+
} else {
68+
lastLoc.column++;
69+
}
70+
71+
lastIndex++;
72+
}
73+
74+
return {
75+
line: lastLoc.line,
76+
column: lastLoc.column
77+
};
78+
}
79+
5280
function onprocessinginstruction(name: string, data: string) {
5381
const directives = defaultDirectives.concat(options.directives ?? []);
5482
const last: Node = bufferArrayLast();
@@ -92,7 +120,15 @@ const parser = (html: string, options: Options = {}): Node[] => {
92120
}
93121

94122
function onopentag(tag: string, attrs: Attributes) {
95-
const buf: Node = {tag};
123+
const start = getLoc(parser.startIndex);
124+
const buf: NodeTag = {tag};
125+
126+
if (options.sourceLocations) {
127+
buf.loc = {
128+
start,
129+
end: start
130+
};
131+
}
96132

97133
if (Object.keys(attrs).length > 0) {
98134
buf.attrs = normalizeArributes(attrs);
@@ -104,6 +140,10 @@ const parser = (html: string, options: Options = {}): Node[] => {
104140
function onclosetag() {
105141
const buf: Node | undefined = bufArray.pop();
106142

143+
if (buf && typeof buf === 'object' && buf.loc && parser.endIndex !== null) {
144+
buf.loc.end = getLoc(parser.endIndex);
145+
}
146+
107147
if (buf) {
108148
const last = bufferArrayLast();
109149

test/test-core.spec.ts

+52
Original file line numberDiff line numberDiff line change
@@ -240,3 +240,55 @@ test('should be not converting html entity name', t => {
240240
const expected = ['&zwnj;&nbsp;&copy;'];
241241
t.deepEqual(tree, expected);
242242
});
243+
244+
test('should parse with source locations', t => {
245+
const html = '<h1>Test</h1>\n<p><b>Foo</b></p>';
246+
const tree = parser(html, {sourceLocations: true});
247+
const expected = [
248+
{
249+
tag: 'h1',
250+
content: ['Test'],
251+
loc: {
252+
start: {
253+
line: 1,
254+
column: 1
255+
},
256+
end: {
257+
line: 1,
258+
column: 13
259+
}
260+
}
261+
},
262+
'\n',
263+
{
264+
tag: 'p',
265+
content: [
266+
{
267+
tag: 'b',
268+
content: ['Foo'],
269+
loc: {
270+
start: {
271+
line: 2,
272+
column: 4
273+
},
274+
end: {
275+
line: 2,
276+
column: 13
277+
}
278+
}
279+
}
280+
],
281+
loc: {
282+
start: {
283+
line: 2,
284+
column: 1
285+
},
286+
end: {
287+
line: 2,
288+
column: 17
289+
}
290+
}
291+
}
292+
];
293+
t.deepEqual(tree, expected);
294+
});

types/index.d.ts

+11
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@ export type Directive = {
1212

1313
export type Options = {
1414
directives?: Directive[];
15+
sourceLocations?: boolean;
1516
} & ParserOptions;
1617

1718
export type Node = NodeText | NodeTag;
@@ -20,6 +21,16 @@ export type NodeTag = {
2021
tag?: string | boolean;
2122
attrs?: Attributes;
2223
content?: Node[];
24+
loc?: SourceLocation;
2325
};
2426

2527
export type Attributes = Record<string, string>;
28+
export type SourceLocation = {
29+
start: Position;
30+
end: Position;
31+
};
32+
33+
export type Position = {
34+
line: number;
35+
column: number;
36+
};

0 commit comments

Comments
 (0)