Skip to content

Commit

Permalink
Add support for inline comment
Browse files Browse the repository at this point in the history
  • Loading branch information
VincentLanglet committed Dec 10, 2024
1 parent a193004 commit 9d06487
Show file tree
Hide file tree
Showing 8 changed files with 99 additions and 15 deletions.
16 changes: 16 additions & 0 deletions docs/custom.md
Original file line number Diff line number Diff line change
Expand Up @@ -137,6 +137,22 @@ The `TwigCsFixer\Token\Tokenizer` transform the file into a list of tokens which

The `#}` delimiter.

- **TwigCsFixer\Token\Token::INLINE_COMMENT_START_TYPE**:

The `#` delimiter.

- **TwigCsFixer\Token\Token::INLINE_COMMENT_TEXT_TYPE**:

Any commented text inside an inline comment. Does not include whitespaces.

- **TwigCsFixer\Token\Token::INLINE_COMMENT_WHITESPACE_TYPE**:

Any commented whitespace inside an inline comment.

- **TwigCsFixer\Token\Token::INLINE_COMMENT_TAB_TYPE**:

Any commented tabulation inside an inline comment.

- **TwigCsFixer\Token\Token::NAMED_ARGUMENT_SEPARATOR_TYPE**:

The `=` or `:` separator used when using named argument. Like `{{ foo(bar=true, baz: false) }}`.
Expand Down
6 changes: 6 additions & 0 deletions src/Token/Token.php
Original file line number Diff line number Diff line change
Expand Up @@ -43,16 +43,22 @@ final class Token
public const COMMENT_TAB_TYPE = 'COMMENT_TAB_TYPE';
public const COMMENT_EOL_TYPE = 'COMMENT_EOL_TYPE';
public const COMMENT_END_TYPE = 'COMMENT_END_TYPE';
public const INLINE_COMMENT_START_TYPE = 'INLINE_COMMENT_START_TYPE';
public const INLINE_COMMENT_TEXT_TYPE = 'INLINE_COMMENT_TEXT_TYPE';
public const INLINE_COMMENT_WHITESPACE_TYPE = 'INLINE_COMMENT_WHITESPACE_TYPE';
public const INLINE_COMMENT_TAB_TYPE = 'INLINE_COMMENT_TAB_TYPE';
public const NAMED_ARGUMENT_SEPARATOR_TYPE = 'NAMED_ARGUMENT_SEPARATOR_TYPE';

public const WHITESPACE_TOKENS = [
self::WHITESPACE_TYPE => self::WHITESPACE_TYPE,
self::COMMENT_WHITESPACE_TYPE => self::COMMENT_WHITESPACE_TYPE,
self::INLINE_COMMENT_WHITESPACE_TYPE => self::INLINE_COMMENT_WHITESPACE_TYPE,
];

public const TAB_TOKENS = [
self::TAB_TYPE => self::TAB_TYPE,
self::COMMENT_TAB_TYPE => self::COMMENT_TAB_TYPE,
self::INLINE_COMMENT_TAB_TYPE => self::INLINE_COMMENT_TAB_TYPE,
];

public const INDENT_TOKENS = self::WHITESPACE_TOKENS + self::TAB_TOKENS;
Expand Down
56 changes: 45 additions & 11 deletions src/Token/Tokenizer.php
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@ final class Tokenizer implements TokenizerInterface
private const STATE_DQ_STRING = 3;
private const STATE_INTERPOLATION = 4;
private const STATE_COMMENT = 5;
private const STATE_INLINE_COMMENT = 6;

public const NAME_PATTERN = '[a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*';
public const NUMBER_PATTERN = '[0-9]+(?:\.[0-9]+)?([Ee][+\-][0-9]+)?';
Expand Down Expand Up @@ -66,7 +67,7 @@ final class Tokenizer implements TokenizerInterface
private array $expressionStarters = [];

/**
* @var array<array{int<0, 5>, array<string, string|null>}>
* @var array<array{int<0, 6>, array<string, string|null>}>
*/
private array $state = [];

Expand Down Expand Up @@ -130,6 +131,9 @@ public function tokenize(Source $source): Tokens
case self::STATE_COMMENT:
$this->lexComment();
break;
case self::STATE_INLINE_COMMENT:
$this->lexInlineComment();
break;
}

if (
Expand Down Expand Up @@ -195,7 +199,7 @@ private function isInTernary(): bool
}

/**
* @return int<0, 5>
* @return int<0, 6>
*/
private function getState(): int
{
Expand All @@ -205,7 +209,7 @@ private function getState(): int
}

/**
* @param int<0, 5> $state
* @param int<0, 6> $state
*/
private function pushState(int $state): void
{
Expand Down Expand Up @@ -346,6 +350,8 @@ private function lexExpression(): void
$this->lexString($match[0]);
} elseif (1 === preg_match(self::REGEX_DQ_STRING_DELIM, $this->code, $match, 0, $this->cursor)) {
$this->lexStartDqString();
} elseif ('#' === $currentCode) {
$this->lexStartInlineComment();
} else {
throw CannotTokenizeException::unexpectedCharacter($currentCode, $this->line);
}
Expand Down Expand Up @@ -401,7 +407,7 @@ private function lexComment(): void
$this->popState();
} else {
if (!$this->hasStateParam('ignoredViolations')) {
$comment = substr($this->code, $this->cursor, $match[0][1]);
$comment = substr($this->code, $this->cursor, $match[0][1] - $this->cursor);
$this->extractIgnoredViolations($comment);
}

Expand All @@ -410,6 +416,19 @@ private function lexComment(): void
}
}

private function lexInlineComment(): void
{
if (!$this->hasStateParam('ignoredViolations')) {
preg_match('/(\r\n|\r|\n)/', $this->code, $match, \PREG_OFFSET_CAPTURE, $this->cursor);
$comment = substr($this->code, $this->cursor, isset($match[0]) ? $match[0][1] - $this->cursor : null);

$this->extractIgnoredViolations($comment);
$this->processIgnoredViolations();
}

$this->lexData();
}

private function lexDqString(): void
{
if (1 === preg_match(self::REGEX_INTERPOLATION_START, $this->code, $match, 0, $this->cursor)) {
Expand Down Expand Up @@ -465,14 +484,16 @@ private function lexData(int $limit = 0): void
} elseif (1 === preg_match('/\S+/', $this->code, $match, 0, $this->cursor)) {
$value = $match[0];

// Stop if cursor reaches the next expression starter.
if (0 !== $limit) {
$value = substr($value, 0, $limit - $this->cursor);
}

if (self::STATE_COMMENT === $this->getState()) {
$this->pushToken(Token::COMMENT_TEXT_TYPE, $value);
} elseif (self::STATE_INLINE_COMMENT === $this->getState()) {
$this->pushToken(Token::INLINE_COMMENT_TEXT_TYPE, $value);
} else {
// Stop if cursor reaches the next expression starter.
if (0 !== $limit) {
$value = substr($value, 0, $limit - $this->cursor);
}

$this->pushToken(Token::TEXT_TYPE, $value);
}
} else {
Expand Down Expand Up @@ -514,6 +535,12 @@ private function lexStart(): void
$this->pushState($state);
}

private function lexStartInlineComment(): void
{
$this->pushToken(Token::INLINE_COMMENT_START_TYPE, '#');
$this->pushState(self::STATE_INLINE_COMMENT);
}

private function lexStartDqString(): void
{
$token = $this->pushToken(Token::DQ_STRING_START_TYPE, '"');
Expand All @@ -539,6 +566,8 @@ private function lexTab(): void

if (self::STATE_COMMENT === $this->getState()) {
$this->pushToken(Token::COMMENT_TAB_TYPE, $whitespace);
} elseif (self::STATE_INLINE_COMMENT === $this->getState()) {
$this->pushToken(Token::INLINE_COMMENT_TAB_TYPE, $whitespace);
} else {
$this->pushToken(Token::TAB_TYPE, $whitespace);
}
Expand All @@ -555,6 +584,8 @@ private function lexWhitespace(): void

if (self::STATE_COMMENT === $this->getState()) {
$this->pushToken(Token::COMMENT_WHITESPACE_TYPE, $whitespace);
} elseif (self::STATE_INLINE_COMMENT === $this->getState()) {
$this->pushToken(Token::INLINE_COMMENT_WHITESPACE_TYPE, $whitespace);
} else {
$this->pushToken(Token::WHITESPACE_TYPE, $whitespace);
}
Expand All @@ -564,6 +595,9 @@ private function lexEOL(string $eol): void
{
if (self::STATE_COMMENT === $this->getState()) {
$this->pushToken(Token::COMMENT_EOL_TYPE, $eol);
} elseif (self::STATE_INLINE_COMMENT === $this->getState()) {
$this->pushToken(Token::EOL_TYPE, $eol);
$this->popState();
} else {
$this->pushToken(Token::EOL_TYPE, $eol);
}
Expand Down Expand Up @@ -774,8 +808,8 @@ private function getOperatorRegex(Environment $env): string
private function extractIgnoredViolations(string $comment): void
{
$comment = trim($comment);
if (1 === preg_match('/^twig-cs-fixer-disable(|-line|-next-line)\s+([\s\w,.:]*)/i', $comment, $match)) {
$this->setStateParam('ignoredViolations', preg_replace('/\s+/', ',', $match[2]) ?? '');
if (1 === preg_match('/^twig-cs-fixer-disable(|-line|-next-line)(?:$|\s+([\s\w,.:]*))/i', $comment, $match)) {
$this->setStateParam('ignoredViolations', preg_replace('/\s+/', ',', $match[2] ?? '') ?? '');
$this->setStateParam('ignoredType', trim($match[1], '-'));
} else {
$this->setStateParam('ignoredViolations', null);
Expand Down
4 changes: 4 additions & 0 deletions tests/Token/Tokenizer/Fixtures/ignored_violations.twig
Original file line number Diff line number Diff line change
Expand Up @@ -3,3 +3,7 @@
{# twig-cs-fixer-disable-line Foo.Bar #}
{# twig-cs-fixer-disable-next-line Foo.Bar Bar.Foo #}
{# twig-cs-fixer-disable-next-line #}

# twig-cs-fixer-disable-next-line
{{ # twig-cs-fixer-disable-next-line
}}
2 changes: 1 addition & 1 deletion tests/Token/Tokenizer/Fixtures/invalid5.twig
Original file line number Diff line number Diff line change
@@ -1 +1 @@
{{ "#{p.first #{}}" }}
{# foo
1 change: 0 additions & 1 deletion tests/Token/Tokenizer/Fixtures/invalid6.twig

This file was deleted.

4 changes: 4 additions & 0 deletions tests/Token/Tokenizer/Fixtures/test17.twig
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
{{
# Inline comment
foo
}}
25 changes: 23 additions & 2 deletions tests/Token/Tokenizer/TokenizerTest.php
Original file line number Diff line number Diff line change
Expand Up @@ -116,6 +116,7 @@ public function testTokenizeIgnoredViolations(): void
'Foo.Bar:5',
'Bar.Foo:5',
':6',
':9',
],
array_map(
static fn (ViolationId $validationId) => $validationId->toString(),
Expand Down Expand Up @@ -814,6 +815,27 @@ public static function tokenizeDataProvider(): iterable
19 => Token::EOF_TYPE,
],
];

yield [
__DIR__.'/Fixtures/test17.twig',
[
0 => Token::VAR_START_TYPE,
1 => Token::EOL_TYPE,
2 => Token::WHITESPACE_TYPE,
3 => Token::INLINE_COMMENT_START_TYPE,
4 => Token::INLINE_COMMENT_WHITESPACE_TYPE,
5 => Token::INLINE_COMMENT_TEXT_TYPE,
6 => Token::INLINE_COMMENT_TAB_TYPE,
7 => Token::INLINE_COMMENT_TEXT_TYPE,
8 => Token::EOL_TYPE,
9 => Token::WHITESPACE_TYPE,
10 => Token::NAME_TYPE,
11 => Token::EOL_TYPE,
12 => Token::VAR_END_TYPE,
13 => Token::EOL_TYPE,
14 => Token::EOF_TYPE,
],
];
}

/**
Expand Down Expand Up @@ -842,7 +864,6 @@ public static function tokenizeInvalidDataProvider(): iterable
yield [__DIR__.'/Fixtures/invalid2.twig', 'Unexpected character "&" at line 4.'];
yield [__DIR__.'/Fixtures/invalid3.twig', 'Unclosed "(" at line 1.'];
yield [__DIR__.'/Fixtures/invalid4.twig', 'Unexpected character ")" at line 1.'];
yield [__DIR__.'/Fixtures/invalid5.twig', 'Unexpected character "#" at line 1.'];
yield [__DIR__.'/Fixtures/invalid6.twig', 'Unclosed comment at line 1.'];
yield [__DIR__.'/Fixtures/invalid5.twig', 'Unclosed comment at line 1.'];
}
}

0 comments on commit 9d06487

Please sign in to comment.