struct DirectiveWithTokens {
  // ...
  DirectiveWithTokens(DirectiveKind Kind, unsigned NumTokens)
      : Kind(Kind), NumTokens(NumTokens) {}
};

struct Scanner {
  Scanner(StringRef Input, /* Tokens, Diags, InputSourceLoc ... */)
      : Input(Input), Tokens(Tokens), Diags(Diags),
        InputSourceLoc(InputSourceLoc), LangOpts(getLangOptsForDepScanning()),
        TheLexer(InputSourceLoc, LangOpts, Input.begin(), Input.begin(),
                 /* ... */) {}

  // In getLangOptsForDepScanning():
    LangOpts.ObjC = true;
    LangOpts.LineComment = true;
    LangOpts.RawStringLiterals = true;
  // ...
  [[nodiscard]] dependency_directives_scan::Token &
  lexToken(const char *&First, const char *const End);
  [[nodiscard]] dependency_directives_scan::Token &
  lexIncludeFilename(const char *&First, const char *const End);

  void skipLine(const char *&First, const char *const End);
  void skipDirective(StringRef Name, const char *&First, const char *const End);

  [[nodiscard]] std::optional<StringRef>
  tryLexIdentifierOrSkipLine(const char *&First, const char *const End);
  [[nodiscard]] StringRef lexIdentifier(const char *&First,
                                        const char *const End);
  [[nodiscard]] bool isNextIdentifierOrSkipLine(StringRef Id, const char *&First,
                                                const char *const End);
  [[nodiscard]] bool isNextTokenOrSkipLine(tok::TokenKind K, const char *&First,
                                           const char *const End);
  [[nodiscard]] std::optional<StringRef>
  tryLexStringLiteralOrSkipLine(const char *&First, const char *const End);

  [[nodiscard]] bool scanImpl(const char *First, const char *const End);
  [[nodiscard]] bool lexPPLine(const char *&First, const char *const End);
  [[nodiscard]] bool lexAt(const char *&First, const char *const End);
  [[nodiscard]] bool lexModule(const char *&First, const char *const End);
  [[nodiscard]] bool lexDefine(const char *HashLoc, const char *&First,
                               const char *const End);
  [[nodiscard]] bool lexPragma(const char *&First, const char *const End);
  [[nodiscard]] bool lex_Pragma(const char *&First, const char *const End);
  [[nodiscard]] bool lexEndif(const char *&First, const char *const End);
  [[nodiscard]] bool lexDefault(DirectiveKind Kind, const char *&First,
                                const char *const End);
  [[nodiscard]] bool lexModuleDirectiveBody(DirectiveKind Kind,
                                            const char *&First,
                                            const char *const End);
  void lexPPDirectiveBody(const char *&First, const char *const End);
  DirectiveWithTokens &pushDirective(DirectiveKind Kind) {
    Tokens.append(CurDirToks);
    DirsWithToks.emplace_back(Kind, CurDirToks.size());
    // ...
    return DirsWithToks.back();
  }
  void popDirective() {
    Tokens.pop_back_n(DirsWithToks.pop_back_val().NumTokens);
  }
  DirectiveKind topDirective() const {
    return DirsWithToks.empty() ? pp_none : DirsWithToks.back().Kind;
  }

  unsigned getOffsetAt(const char *CurPtr) const {
    return CurPtr - Input.data();
  }

  bool reportError(const char *CurPtr, unsigned Err);

  StringMap<char> SplitIds;
  // ...
  const char *LastTokenPtr = nullptr;
  // ...
};
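The pushDirective/popDirective/topDirective helpers above keep one flat token buffer plus a parallel list of (Kind, NumTokens) records, so undoing the most recently lexed directive is just a truncation of the token buffer's tail. A minimal, self-contained sketch of that bookkeeping pattern (hypothetical MiniDirectiveStack type with int stand-ins for tokens, not the Scanner's actual types):

// Sketch only: each directive records how many tokens it appended to a shared
// flat buffer, so removing the last directive is a single resize.
#include <cassert>
#include <vector>

enum DirectiveKind { pp_none, pp_if, pp_endif };

struct MiniDirectiveStack {
  struct Entry { DirectiveKind Kind; unsigned NumTokens; };
  std::vector<int> Tokens;          // stand-in for the lexed token buffer
  std::vector<Entry> DirsWithToks;  // (kind, token count) per directive
  std::vector<int> CurDirToks;      // tokens of the directive being lexed

  void pushDirective(DirectiveKind Kind) {
    Tokens.insert(Tokens.end(), CurDirToks.begin(), CurDirToks.end());
    DirsWithToks.push_back({Kind, (unsigned)CurDirToks.size()});
    CurDirToks.clear();
  }
  void popDirective() {
    assert(!DirsWithToks.empty());
    Tokens.resize(Tokens.size() - DirsWithToks.back().NumTokens);
    DirsWithToks.pop_back();
  }
  DirectiveKind topDirective() const {
    return DirsWithToks.empty() ? pp_none : DirsWithToks.back().Kind;
  }
};

Recording only counts keeps the tokens contiguous, which is what Scanner::scan() below relies on when it slices the buffer with take_front/drop_front per directive.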
bool Scanner::reportError(const char *CurPtr, unsigned Err) {
  // ...
  assert(CurPtr >= Input.data() && "invalid buffer ptr");
  Diags->Report(InputSourceLoc.getLocWithOffset(getOffsetAt(CurPtr)), Err);
  // ...
}
static bool isRawStringLiteral(const char *First, const char *Current) {
  assert(First <= Current);
  // ...
  if (*Current != '"' || First == Current)
    // ...
  if (*Current != 'R')
    // ...
  if (*Current == 'u' || *Current == 'U' || *Current == 'L')
    // ...
  if (*Current != '8' || First == Current || *Current-- != 'u')
    // ...
}

static void skipRawString(const char *&First, const char *const End) {
  assert(First[0] == '"');
  assert(First[-1] == 'R');
  // ...
  while (Last != End && *Last != '(')
    // ...
  while (Last != End && size_t(Last - First) < Terminator.size() &&
         /* ... */)
    // ...
  if (size_t(Last - First) < Terminator.size())
    // ...
}
static unsigned isEOL(const char *First, const char *const End) {
  // ...
}

// In skipString():
  const char Terminator = *First == '<' ? '>' : *First;
  // ...
  if (*First != '\\')
    // ...
  const char *FirstAfterBackslashPastSpace = First;
  // ...
  if (unsigned NLSize = isEOL(FirstAfterBackslashPastSpace, End)) {
    // ...
    First = FirstAfterBackslashPastSpace + NLSize - 1;
  }

// In skipNewline():
  assert(Len && "expected newline");

// In wasLineContinuation():
  return *(First - (int)EOLLen - 1) == '\\';
// In skipToNewlineRaw():
  if (First[-1] != '\\')
    // ...

static void skipLineComment(const char *&First, const char *const End) {
  assert(First[0] == '/' && First[1] == '/');
  // ...
}

static void skipBlockComment(const char *&First, const char *const End) {
  assert(First[0] == '/' && First[1] == '*');
  if (End - First < 4) {
    // ...
  }
  // ...
  if (First[-1] == '*' && First[0] == '/') {
    // ...
  }
}

static bool isQuoteCppDigitSeparator(const char *const Start,
                                     const char *const Cur,
                                     const char *const End) {
  assert(*Cur == '\'' && "expected quotation character");
  // ...
  char Prev = *(Cur - 1);
  if (Prev == 'L' || Prev == 'U' || Prev == 'u')
    // ...
  if (Prev == '8' && (Cur - 1 != Start) && *(Cur - 2) == 'u')
    // ...
}
void Scanner::skipLine(const char *&First, const char *const End) {
  // ...
    assert(First <= End);
    // ...
    const char *Start = First;
    // ...
    if (*First == '"' ||
        /* ... */) {
      LastTokenPtr = First;
      // ...
    }
    // ...
    LastTokenPtr = First;
    // ...
    if (First[1] == '/') {
      // ...
    }
    if (First[1] != '*') {
      LastTokenPtr = First;
      // ...
    }
  // ...
}
void Scanner::skipDirective(StringRef Name, const char *&First,
                            const char *const End) {
  if (llvm::StringSwitch<bool>(Name)
          .Case("warning", true)
          .Case("error", true)
          /* ... */)
    // ...
  skipLine(First, End);
}

// In skipWhitespace():
  assert(First <= End);
  // ...
  if (First[0] != '/')
    // ...
  if (First[1] == '/') {
    // ...
  }
  if (First[1] != '*')
    // ...
bool Scanner::lexModuleDirectiveBody(DirectiveKind Kind, const char *&First,
                                     const char *const End) {
  const char *DirectiveLoc = Input.data() + CurDirToks.front().Offset;
  // ...
    if (Tok.is(tok::eof))
      return reportError(
          DirectiveLoc,
          diag::err_dep_source_scanner_missing_semi_after_at_import);
    if (Tok.is(tok::semi))
      // ...
  // ...
    return reportError(
        DirectiveLoc, diag::err_dep_source_scanner_unexpected_tokens_at_import);
  // ...
}

dependency_directives_scan::Token &Scanner::lexToken(const char *&First,
                                                     const char *const End) {
  // ...
  TheLexer.LexFromRawLexer(Tok);
  First = Input.data() + TheLexer.getCurrentBufferOffset();
  assert(First <= End);

  unsigned Offset = TheLexer.getCurrentBufferOffset() - Tok.getLength();
  // ...
  return CurDirToks.back();
}
dependency_directives_scan::Token &
Scanner::lexIncludeFilename(const char *&First, const char *const End) {
  // ...
  TheLexer.LexIncludeFilename(Tok);
  First = Input.data() + TheLexer.getCurrentBufferOffset();
  assert(First <= End);

  unsigned Offset = TheLexer.getCurrentBufferOffset() - Tok.getLength();
  // ...
  return CurDirToks.back();
}
void Scanner::lexPPDirectiveBody(const char *&First, const char *const End) {
  // ...
    if (Tok.is(tok::eod) || Tok.is(tok::eof))
      // ...
}

// In Scanner::cleanStringIfNeeded():
  if (LLVM_LIKELY(!NeedsCleaning))
    // ...
  Spelling.resize(Tok.Length);
  // ...
  unsigned SpellingLength = 0;
  const char *BufPtr = Input.begin() + Tok.Offset;
  const char *AfterIdent = Input.begin() + Tok.getEnd();
  while (BufPtr < AfterIdent) {
    // ...
    Spelling[SpellingLength++] = Char;
  }
  // ...
  return SplitIds.try_emplace(StringRef(Spelling.begin(), SpellingLength), 0)
      /* ... */;
std::optional<StringRef>
Scanner::tryLexIdentifierOrSkipLine(const char *&First, const char *const End) {
  // ...
  if (Tok.isNot(tok::raw_identifier)) {
    if (!Tok.is(tok::eod))
      skipLine(First, End);
    // ...
  }
  // ...
  return cleanStringIfNeeded(Tok);
}

StringRef Scanner::lexIdentifier(const char *&First, const char *const End) {
  std::optional<StringRef> Id = tryLexIdentifierOrSkipLine(First, End);
  assert(Id && "expected identifier token");
  // ...
}
bool Scanner::isNextIdentifierOrSkipLine(StringRef Id, const char *&First,
                                         const char *const End) {
  if (std::optional<StringRef> FoundId =
          tryLexIdentifierOrSkipLine(First, End)) {
    // ...
    skipLine(First, End);
    // ...
  }
  // ...
}

bool Scanner::isNextTokenOrSkipLine(tok::TokenKind K, const char *&First,
                                    const char *const End) {
  // ...
  skipLine(First, End);
  // ...
}
std::optional<StringRef>
Scanner::tryLexStringLiteralOrSkipLine(const char *&First,
                                       const char *const End) {
  // ...
  if (!Tok.is(tok::eod))
    skipLine(First, End);
  // ...
  return cleanStringIfNeeded(Tok);
}
bool Scanner::lexAt(const char *&First, const char *const End) {
  // ...
  assert(AtTok.is(tok::at));
  // ...
  if (!isNextIdentifierOrSkipLine("import", First, End))
    // ...
}
bool Scanner::lexModule(const char *&First, const char *const End) {
  StringRef Id = lexIdentifier(First, End);
  bool Export = false;
  if (Id == "export") {
    // ...
    std::optional<StringRef> NextId = tryLexIdentifierOrSkipLine(First, End);
    // ...
  }

  if (Id != "module" && Id != "import") {
    skipLine(First, End);
    // ...
  }
  // ...
  if (Id == "module") {
    skipLine(First, End);
    // ...
  }
  // ...
  (void)lexToken(First, End);
  if (!tryLexIdentifierOrSkipLine(First, End))
    // ...
  skipLine(First, End);
  // ...
  TheLexer.seek(getOffsetAt(First), false);
  // ...
  if (Id == "module")
    // ...
  return lexModuleDirectiveBody(Kind, First, End);
}
bool Scanner::lex_Pragma(const char *&First, const char *const End) {
  if (!isNextTokenOrSkipLine(tok::l_paren, First, End))
    // ...
  std::optional<StringRef> Str = tryLexStringLiteralOrSkipLine(First, End);

  if (!Str || !isNextTokenOrSkipLine(tok::r_paren, First, End))
    // ...
  // ...
  const char *Begin = Buffer.c_str();
  Scanner PragmaScanner{StringRef(Begin, Buffer.size()), DiscardTokens, Diags,
                        /* ... */};
  // ...
  PragmaScanner.TheLexer.setParsingPreprocessorDirective(true);
  if (PragmaScanner.lexPragma(Begin, Buffer.end()))
    // ...
  skipLine(First, End);
  // ...
  assert(Begin == Buffer.end());
  // ...
}
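lex_Pragma above re-scans the _Pragma operator's string argument: the literal is destringized (see prepare_PragmaString in the index below, per C11 6.10.9.1) and a nested Scanner runs lexPragma over the resulting buffer. As a rough illustration of that destringization rule, here is a small stand-alone sketch; the destringize helper is hypothetical and is not clang's implementation:

#include <cassert>
#include <string>

// Sketch of C11 6.10.9.1 destringization: drop an optional L prefix and the
// surrounding quotes, then turn \" into " and \\ into a single backslash.
static std::string destringize(std::string S) {
  if (!S.empty() && S.front() == 'L')
    S.erase(S.begin());
  assert(S.size() >= 2 && S.front() == '"' && S.back() == '"');
  S = S.substr(1, S.size() - 2);
  std::string Out;
  for (size_t I = 0; I < S.size(); ++I) {
    if (S[I] == '\\' && I + 1 < S.size() &&
        (S[I + 1] == '"' || S[I + 1] == '\\'))
      ++I; // skip the backslash, keep the escaped character
    Out += S[I];
  }
  return Out;
}
// destringize("\"clang module import A\"") yields: clang module import A
// (the module name A is purely illustrative), which a nested scanner can then
// treat like an ordinary #pragma line.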
bool Scanner::lexPragma(const char *&First, const char *const End) {
  std::optional<StringRef> FoundId = tryLexIdentifierOrSkipLine(First, End);
  // ...
  StringRef Id = *FoundId;
  auto Kind = llvm::StringSwitch<DirectiveKind>(Id)
                  /* ... */;
  // ...
    lexPPDirectiveBody(First, End);
    // ...
  if (Id != "clang") {
    skipLine(First, End);
    // ...
  }

  FoundId = tryLexIdentifierOrSkipLine(First, End);
  // ...
  if (Id == "system_header") {
    lexPPDirectiveBody(First, End);
    // ...
  }
  if (Id != "module") {
    skipLine(First, End);
    // ...
  }
  // ...
  if (!isNextIdentifierOrSkipLine("import", First, End))
    // ...
  lexPPDirectiveBody(First, End);
  // ...
}
bool Scanner::lexEndif(const char *&First, const char *const End) {
  // ...
  if (topDirective() == pp_else)
    // ...
  skipLine(First, End);
  // ...
}

bool Scanner::lexDefault(DirectiveKind Kind, const char *&First,
                         const char *const End) {
  lexPPDirectiveBody(First, End);
  // ...
}
bool Scanner::lexPPLine(const char *&First, const char *const End) {
  assert(First != End);
  // ...
  assert(First <= End);
  // ...
    skipLine(First, End);
    assert(First <= End);
    // ...
  LastTokenPtr = First;
  // ...
  TheLexer.seek(getOffsetAt(First), true);

  auto ScEx1 = make_scope_exit([&]() {
    // ...
  });

  // ...
    return lexAt(First, End);
  // ...
    return lexModule(First, End);

  if (*First == '_') {
    if (isNextIdentifierOrSkipLine("_Pragma", First, End))
      return lex_Pragma(First, End);
    // ...
  }

  // ...
  TheLexer.setParsingPreprocessorDirective(true);
  auto ScEx2 = make_scope_exit(
      [&]() { TheLexer.setParsingPreprocessorDirective(false); });

  // ...
  if (HashTok.is(tok::hashhash)) {
    // ...
    skipLine(First, End);
    assert(First <= End);
    // ...
  }
  assert(HashTok.is(tok::hash));
  // ...
  std::optional<StringRef> FoundId = tryLexIdentifierOrSkipLine(First, End);
  // ...
  StringRef Id = *FoundId;

  if (Id == "pragma")
    return lexPragma(First, End);

  auto Kind = llvm::StringSwitch<DirectiveKind>(Id)
                  /* ... */
                  .Case("if", pp_if)
                  /* ... */;
  // ...
    skipDirective(Id, First, End);
    // ...
    return lexEndif(First, End);
  // ...
    if (lexIncludeFilename(First, End).is(tok::eod)) {
      // ...
    }
  // ...
  return lexDefault(Kind, First, End);
}
static void skipUTF8ByteOrderMark(const char *&First, const char *const End) {
  if ((End - First) >= 3 && First[0] == '\xef' && First[1] == '\xbb' &&
      First[2] == '\xbf')
    First += 3;
}
bool Scanner::scanImpl(const char *First, const char *const End) {
  // ...
  while (First != End)
    if (lexPPLine(First, End))
      // ...
}

// In Scanner::scan():
  bool Error = scanImpl(Input.begin(), Input.end());
  // ...
  if (/* ... */
      (Tokens.empty() || LastTokenPtr > Input.begin() + Tokens.back().Offset))
    // ...
  for (const DirectiveWithTokens &DirWithToks : DirsWithToks) {
    assert(RemainingTokens.size() >= DirWithToks.NumTokens);
    Directives.emplace_back(DirWithToks.Kind,
                            RemainingTokens.take_front(DirWithToks.NumTokens));
    RemainingTokens = RemainingTokens.drop_front(DirWithToks.NumTokens);
  }
  assert(RemainingTokens.empty());
bool clang::scanSourceForDependencyDirectives(
    StringRef Input, SmallVectorImpl<dependency_directives_scan::Token> &Tokens,
    SmallVectorImpl<dependency_directives_scan::Directive> &Directives,
    DiagnosticsEngine *Diags, SourceLocation InputSourceLoc) {
  return Scanner(Input, Tokens, Diags, InputSourceLoc).scan(Directives);
}
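For context, a hedged usage sketch of this entry point, based only on the signatures listed in the index below (scanSourceForDependencyDirectives and printDependencyDirectivesAsSource); the helper name and buffer sizes are illustrative:

#include "clang/Lex/DependencyDirectivesScanner.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/Support/raw_ostream.h"

// Scan an in-memory buffer and re-print only the directives that matter for
// dependency scanning. The bool result reports failure (see "bool Error" in
// Scanner::scan above); with no DiagnosticsEngine passed, failures are silent.
static void minimizeForDependencies(llvm::StringRef Source) {
  llvm::SmallVector<clang::dependency_directives_scan::Token, 64> Tokens;
  llvm::SmallVector<clang::dependency_directives_scan::Directive, 32> Directives;
  if (clang::scanSourceForDependencyDirectives(Source, Tokens, Directives))
    return;
  clang::printDependencyDirectivesAsSource(Source, Directives, llvm::outs());
}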
void clang::printDependencyDirectivesAsSource(
    StringRef Source, ArrayRef<dependency_directives_scan::Directive> Directives,
    llvm::raw_ostream &OS) {
  // ...
  auto needsSpaceSeparator =
      [/* ... */](tok::TokenKind Prev,
                  const dependency_directives_scan::Token &Tok) {
        if (Prev == Tok.Kind)
          return !Tok.isOneOf(tok::l_paren, tok::r_paren, tok::l_square,
                              /* ... */);
        if (Prev == tok::raw_identifier &&
            Tok.isOneOf(tok::hash, tok::numeric_constant, tok::string_literal,
                        tok::char_constant, tok::header_name))
          // ...
        if (Prev == tok::r_paren &&
            Tok.isOneOf(tok::raw_identifier, tok::hash, tok::string_literal,
                        tok::char_constant, tok::unknown))
          // ...
        if (Prev == tok::comma &&
            Tok.isOneOf(tok::l_paren, tok::string_literal, tok::less))
          // ...
      };

  // ...
      OS << "<TokBeforeEOF>";
    // ...
  std::optional<tok::TokenKind> PrevTokenKind;
  // ...
    if (PrevTokenKind && needsSpaceSeparator(*PrevTokenKind, Tok))
      // ...
    PrevTokenKind = Tok.Kind;
  // ...
}
Defines the Diagnostic-related interfaces.
static void skipBlockComment(const char *&First, const char *const End)
static void skipRawString(const char *&First, const char *const End)
static void skipString(const char *&First, const char *const End)
static bool isStartOfRelevantLine(char First)
static void skipWhitespace(const char *&First, const char *const End)
static bool isRawStringLiteral(const char *First, const char *Current)
static void skipOverSpaces(const char *&First, const char *const End)
static unsigned isEOL(const char *First, const char *const End)
static void skipToNewlineRaw(const char *&First, const char *const End)
static unsigned skipNewline(const char *&First, const char *End)
static void skipUTF8ByteOrderMark(const char *&First, const char *const End)
static void skipLineComment(const char *&First, const char *const End)
static bool isQuoteCppDigitSeparator(const char *const Start, const char *const Cur, const char *const End)
static bool wasLineContinuation(const char *First, unsigned EOLLen)
This is the interface for scanning header and source files to get the minimum necessary preprocessor ...
Concrete class used by the front-end to report problems and issues.
Keeps track of the various options that can be enabled, which controls the dialect of C or C++ that i...
Lexer - This provides a simple interface that turns a text buffer into a stream of tokens.
static SizedChar getCharAndSizeNoWarn(const char *Ptr, const LangOptions &LangOpts)
getCharAndSizeNoWarn - Like the getCharAndSize method, but does not ever emit a warning.
Encodes a location in the source.
Token - This structure provides full information about a lexed token.
unsigned getFlags() const
Return the internal representation of the flags.
unsigned getLength() const
tok::TokenKind getKind() const
DirectiveKind
Represents the kind of preprocessor directive or a module declaration that is tracked by the scanner ...
@ tokens_present_before_eof
Indicates that there are tokens present between the last scanned directive and eof.
@ pp_pragma_system_header
@ pp_pragma_include_alias
bool isStringLiteral(TokenKind K)
Return true if this is a C or C++ string-literal (or C++11 user-defined-string-literal) token.
TokenKind
Provides a simple uniform namespace for tokens from all C languages.
The JSON file list parser is used to communicate input to InstallAPI.
LLVM_READONLY bool isVerticalWhitespace(unsigned char c)
Returns true if this character is vertical ASCII whitespace: '\n', '\r'.
LLVM_READONLY bool isAsciiIdentifierContinue(unsigned char c)
void printDependencyDirectivesAsSource(StringRef Source, ArrayRef< dependency_directives_scan::Directive > Directives, llvm::raw_ostream &OS)
Print the previously scanned dependency directives as minimized source text.
LLVM_READONLY bool isHorizontalWhitespace(unsigned char c)
Returns true if this character is horizontal ASCII whitespace: ' ', '\t', '\f', '\v'.
bool scanSourceForDependencyDirectives(StringRef Input, SmallVectorImpl< dependency_directives_scan::Token > &Tokens, SmallVectorImpl< dependency_directives_scan::Directive > &Directives, DiagnosticsEngine *Diags=nullptr, SourceLocation InputSourceLoc=SourceLocation())
Scan the input for the preprocessor directives that might have an effect on the dependencies for a co...
LLVM_READONLY bool isWhitespace(unsigned char c)
Return true if this character is horizontal or vertical ASCII whitespace: ' ', '\t',...
LLVM_READONLY bool isPreprocessingNumberBody(unsigned char c)
Return true if this is the body character of a C preprocessing number, which is [a-zA-Z0-9_.
void prepare_PragmaString(SmallVectorImpl< char > &StrVal)
Destringize a _Pragma("") string according to C11 6.10.9.1: "The string literal is destringized by de...
Diagnostic wrappers for TextAPI types for error reporting.
Represents a directive that's lexed as part of the dependency directives scanning.
DirectiveKind Kind
The kind of token.
Token lexed as part of dependency directive scanning.
bool isNot(tok::TokenKind K) const
unsigned Offset
Offset into the original source input.
bool is(tok::TokenKind K) const
bool isOneOf(tok::TokenKind K1, tok::TokenKind K2) const