-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathiwyu_lexer_utils.cc
149 lines (132 loc) · 4.85 KB
/
iwyu_lexer_utils.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
//===--- iwyu_lexer_utils.cc - clang-lexer utilities for iwyu -------------===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
#include "iwyu_lexer_utils.h"
#include <string.h>
#include <string>
#include <vector>
#include "iwyu_verrs.h"
#include "port.h"
#include "llvm/Support/raw_ostream.h"
#include "clang/Basic/LangOptions.h"
#include "clang/Basic/SourceLocation.h"
#include "clang/Basic/SourceManager.h"
#include "clang/Lex/Lexer.h"
#include "clang/Lex/Token.h"
using clang::Lexer;
using clang::LangOptions;
using clang::SourceLocation;
using clang::SourceManager;
using clang::SourceRange;
using clang::Token;
using std::string;
using std::vector;
namespace include_what_you_use {
// SourceManagerCharacterDataGetter method implementations.
// Constructs a getter whose source_manager_ member is initialized from the
// given SourceManager; no other work is done here.
SourceManagerCharacterDataGetter::SourceManagerCharacterDataGetter(
    const SourceManager& source_manager)
    : source_manager_(source_manager) {}
// Returns a pointer to the character data at |loc|, as reported by
// source_manager_.getCharacterData().  CHECK-fails if the source manager
// flags the lookup as invalid or hands back a null pointer, so callers
// always receive a non-null pointer.
const char* SourceManagerCharacterDataGetter::GetCharacterData(
    SourceLocation loc) const {
  // Start from a known value: the flag is an out-parameter, and the CHECK_
  // below must never read an indeterminate bool should the callee return
  // without writing to it.
  bool invalid = false;
  const char* data = source_manager_.getCharacterData(loc, &invalid);
  CHECK_(!invalid);
  CHECK_(data);
  return data;
}
// Returns the text beginning at |start_loc| and running up to, but not
// including, the first '\n'.  When the nul-terminated character data holds
// no newline, everything up to the terminator is returned.
string GetSourceTextUntilEndOfLine(
    SourceLocation start_loc,
    const CharacterDataGetterInterface& data_getter) {
  const char* const text = data_getter.GetCharacterData(start_loc);
  // strcspn stops at the first '\n' or at the terminating nul, whichever
  // comes first, which is exactly the length of the current line.
  const size_t line_length = strcspn(text, "\n");
  return string(text, line_length);
}
// Searches the character data starting at |start_loc| for the first
// occurrence of |needle| and returns the location just past that occurrence.
// Returns a default-constructed (invalid) SourceLocation when |needle| is
// not found.  CHECK-fails if |start_loc| itself is not valid.
SourceLocation GetLocationAfter(
    SourceLocation start_loc, const string& needle,
    const CharacterDataGetterInterface& data_getter) {
  CHECK_(start_loc.isValid() && "GetLocationAfter takes only valid locations");
  const char* const text = data_getter.GetCharacterData(start_loc);
  if (const char* const match = strstr(text, needle.c_str())) {
    // Offset of the match from the start, plus the needle itself.
    return start_loc.getLocWithOffset(match - text + needle.length());
  }
  return SourceLocation();  // invalid source location
}
// Returns the include name exactly as written at |include_loc|, delimiters
// included: either <...> or "...".  The text considered is the rest of the
// line starting at |include_loc|.  An empty line yields an empty string; a
// first character other than '<' or '"', or a missing closing delimiter,
// trips a CHECK.
string GetIncludeNameAsTyped(SourceLocation include_loc,
                             const CharacterDataGetterInterface& data_getter) {
  const string line = GetSourceTextUntilEndOfLine(include_loc, data_getter);
  if (line.empty())
    return line;

  // Locate the closing delimiter that matches the opening one.
  string::size_type endpos = string::npos;
  switch (line[0]) {
    case '<':
      endpos = line.find('>', 1);
      break;
    case '"':
      endpos = line.find('"', 1);
      break;
    default:
      CHECK_UNREACHABLE_("Unexpected token being #included");
  }
  CHECK_(endpos != string::npos && "No end-character found for #include");
  return line.substr(0, endpos+1);
}
// Returns the spelling of |token|: token.getLength() characters read from
// the character data at the token's location.
string GetTokenText(const Token& token,
                    const CharacterDataGetterInterface& data_getter) {
  const SourceLocation token_start = token.getLocation();
  const char* const spelling = data_getter.GetCharacterData(token_start);
  return string(spelling, token.getLength());
}
// Given the range of an #if or #elif statement, collects the identifier
// tokens that appear as arguments to "defined", in both the "defined X" and
// "defined(X)" spellings.  This allows iwyu to treat these symbols as if
// #ifdef was used instead.  CHECK-fails if "defined" (optionally followed by
// a left paren) is not followed by an identifier.
vector<Token> FindArgumentsToDefined(
    SourceRange range,
    const CharacterDataGetterInterface& data_getter) {
  const char* const begin = data_getter.GetCharacterData(range.getBegin());
  const char* const end = data_getter.GetCharacterData(range.getEnd());

  // The lexer wants nul-terminated text, so lex from a private copy of the
  // range rather than from the original buffer.
  const unsigned length = end - begin;
  const string buffer(begin, length);
  const char* const buffer_start = buffer.c_str();
  VERRS(7) << "Lexing: " << buffer << "\n";
  Lexer lexer(range.getBegin(), LangOptions(), buffer_start, buffer_start,
              buffer_start + length);

  // Tiny state machine; the enumerator order matters because the numeric
  // state value is written to the verbose log below.
  enum {
    kLookingForDefined,
    kExpectingLeftParenOrDefinedIdentifier,
    kExpectingDefinedIdentifier
  } state = kLookingForDefined;

  vector<Token> defined_args;
  Token token;
  while (!lexer.LexFromRawLexer(token)) {
    VERRS(7) << "Processing token \""
             << GetTokenText(token, data_getter)
             << "\" of type " << token.getName()
             << " in state " << state << "\n";

    if (state == kLookingForDefined) {
      // Skip everything until the "defined" keyword shows up.
      if (token.getKind() == clang::tok::raw_identifier &&
          GetTokenText(token, data_getter) == "defined") {
        state = kExpectingLeftParenOrDefinedIdentifier;
      }
      continue;
    }

    if (state == kExpectingLeftParenOrDefinedIdentifier &&
        token.getKind() == clang::tok::l_paren) {
      // "defined(" form: the identifier must come next.
      state = kExpectingDefinedIdentifier;
      continue;
    }

    // Either state that reaches this point requires the identifier itself.
    CHECK_(token.getKind() == clang::tok::raw_identifier);
    defined_args.push_back(token);
    state = kLookingForDefined;
  }
  return defined_args;
}
} // namespace include_what_you_use