-
Notifications
You must be signed in to change notification settings - Fork 50
/
Copy pathcomment.cc
406 lines (356 loc) · 12.3 KB
/
comment.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "comment.hh"
#include "funcdata.hh"
namespace ghidra {
/// Marshaling element \<comment>: opened by Comment::encode() around a single comment
ElementId ELEM_COMMENT = ElementId("comment",86);
/// Marshaling element \<commentdb>: opened by CommentDatabaseInternal::encode() around all comments
ElementId ELEM_COMMENTDB = ElementId("commentdb",87);
/// Marshaling element \<text>: child of \<comment> that carries the comment body
ElementId ELEM_TEXT = ElementId("text",88);
/// Build a comment from its individual pieces.  The new comment starts out
/// marked as \e not emitted.
/// \param tp is the set of properties to associate with the comment (or 0 for no properties)
/// \param fad is the Address of the function containing the comment
/// \param ad is the Address of the instruction associated with the comment
/// \param uq is used internally to sub-sort comments at the same address
/// \param txt is the body of the comment
Comment::Comment(uint4 tp,const Address &fad,const Address &ad,int4 uq,const string &txt)
  : type(tp),
    uniq(uq),
    funcaddr(fad),
    addr(ad),
    text(txt),
    emitted(false)
{
}
/// The single comment is encoded as a \<comment> element.  It carries the type
/// as an attribute, followed by one address element for the containing function,
/// one address element for the comment's own location, and a \<text> element
/// holding the comment body.
/// \param encoder is the stream encoder
void Comment::encode(Encoder &encoder) const
{
  // Resolve the type name first: an unknown type throws before anything is written
  const string typeName = Comment::decodeCommentType(type);

  encoder.openElement(ELEM_COMMENT);
  encoder.writeString(ATTRIB_TYPE, typeName);

  // Address of the function containing the comment
  encoder.openElement(ELEM_ADDR);
  funcaddr.getSpace()->encodeAttributes(encoder,funcaddr.getOffset());
  encoder.closeElement(ELEM_ADDR);

  // Address the comment itself is attached to
  encoder.openElement(ELEM_ADDR);
  addr.getSpace()->encodeAttributes(encoder,addr.getOffset());
  encoder.closeElement(ELEM_ADDR);

  // Body of the comment
  encoder.openElement(ELEM_TEXT);
  encoder.writeString(ATTRIB_CONTENT, text);
  encoder.closeElement(ELEM_TEXT);

  encoder.closeElement(ELEM_COMMENT);
}
/// Parse a \<comment> element from the given stream decoder.
///
/// The element supplies a type attribute, then two addresses (the containing
/// function first, the comment location second), then an optional child element
/// whose content attribute is the comment body.  All decoded state is reset up
/// front, so a comment with no text child ends up with an empty body even when
/// this object was previously used to decode a different comment.
/// \param decoder is the given stream decoder
void Comment::decode(Decoder &decoder)
{
  // Reset anything a previous decode (or construction) may have left behind
  emitted = false;
  type = 0;
  text.clear();

  uint4 elemId = decoder.openElement(ELEM_COMMENT);
  type = Comment::encodeCommentType(decoder.readString(ATTRIB_TYPE));
  funcaddr = Address::decode(decoder);
  addr = Address::decode(decoder);
  uint4 subId = decoder.peekElement();
  if (subId != 0) {		// The text child is optional
    decoder.openElement();
    text = decoder.readString(ATTRIB_CONTENT);
    decoder.closeElement(subId);
  }
  decoder.closeElement(elemId);
}
/// Convert the name of a single comment property into its enumerated value.
/// A name that matches none of the known properties raises a LowlevelError.
/// \param name is a string representation of a single comment property
/// \return the enumerated property type
uint4 Comment::encodeCommentType(const string &name)
{
  struct NamedProperty {
    const char *label;		// Name as it appears in the encoded form
    uint4 value;		// Matching enumerated property
  };
  static const NamedProperty known[] = {
    { "user1", Comment::user1 },
    { "user2", Comment::user2 },
    { "user3", Comment::user3 },
    { "header", Comment::header },
    { "warning", Comment::warning },
    { "warningheader", Comment::warningheader }
  };
  const uint4 count = sizeof(known) / sizeof(known[0]);

  for(uint4 i=0;i<count;++i) {
    if (name == known[i].label)
      return known[i].value;
  }
  throw LowlevelError("Unknown comment type: "+name);
}
/// Convert a single enumerated comment property into its name.
/// A value that is not exactly one of the known properties raises a LowlevelError.
/// \param val is a single comment property
/// \return the string representation of the property
string Comment::decodeCommentType(uint4 val)
{
  if (val == user1)
    return "user1";
  if (val == user2)
    return "user2";
  if (val == user3)
    return "user3";
  if (val == header)
    return "header";
  if (val == warning)
    return "warning";
  if (val == warningheader)
    return "warningheader";
  throw LowlevelError("Unknown comment type");
}
/// Comments are ordered by function address first, then by the address the
/// comment is attached to, and finally by the sub-sort index.
/// \param a is the first Comment to compare
/// \param b is the second
/// \return \b true if the first is ordered before the second
bool CommentOrder::operator()(const Comment *a,const Comment *b) const
{
  const Address &funcA = a->getFuncAddr();
  const Address &funcB = b->getFuncAddr();
  if (funcA != funcB)
    return (funcA < funcB);

  const Address &addrA = a->getAddr();
  const Address &addrB = b->getAddr();
  if (addrA != addrB)
    return (addrA < addrB);

  // Same function and address: the sub-sort index decides (equal indices are not "less")
  return (a->getUniq() < b->getUniq());
}
/// Construct an empty comment container.
CommentDatabaseInternal::CommentDatabaseInternal(void) : CommentDatabase()
{
  // Nothing else to set up: the underlying set starts out empty
}
/// Free every Comment object still referenced by the container.
CommentDatabaseInternal::~CommentDatabaseInternal(void)
{
  CommentSet::iterator cur = commentset.begin();
  while(cur != commentset.end()) {
    delete *cur;
    ++cur;
  }
}
void CommentDatabaseInternal::clear(void)
{
CommentSet::iterator iter;
for(iter=commentset.begin();iter!=commentset.end();++iter)
delete *iter;
commentset.clear();
}
void CommentDatabaseInternal::clearType(const Address &fad,uint4 tp)
{
Comment testcommbeg(0,fad,Address(Address::m_minimal),0,"");
Comment testcommend(0,fad,Address(Address::m_maximal),65535,"");
CommentSet::iterator iterbegin = commentset.lower_bound(&testcommbeg);
CommentSet::iterator iterend = commentset.lower_bound(&testcommend);
CommentSet::iterator iter;
while(iterbegin != iterend) {
iter = iterbegin;
++iter;
if (((*iterbegin)->getType()&tp)!=0) {
delete (*iterbegin);
commentset.erase(iterbegin);
}
iterbegin = iter;
}
}
/// Create a new comment and store it in the container.
///
/// The sub-sort index of the new comment is one more than that of the comment
/// just before its slot, provided that comment has the same function and
/// instruction address; otherwise the index is 0.
/// \param tp is the set of properties to associate with the comment
/// \param fad is the Address of the function containing the comment
/// \param ad is the Address of the instruction associated with the comment
/// \param txt is the body of the comment
void CommentDatabaseInternal::addComment(uint4 tp,const Address &fad,
					 const Address &ad,
					 const string &txt)
{
  // A large placeholder index makes the search land after existing comments at (fad,ad)
  Comment *fresh = new Comment(tp,fad,ad,65535,txt);
  CommentSet::iterator pos = commentset.lower_bound(fresh);
  if (pos != commentset.begin())
    --pos;			// Back up to the element just ahead of the slot

  fresh->uniq = 0;
  if (pos != commentset.end()) {
    const Comment *prev = *pos;
    if ((prev->getAddr() == ad) && (prev->getFuncAddr() == fad))
      fresh->uniq = prev->getUniq() + 1;
  }
  commentset.insert(fresh);
}
/// Store a new comment unless one with identical text already exists at the
/// same function and instruction address.
///
/// The search uses a stack-allocated probe key, so nothing is heap-allocated
/// (and the text is not copied) when the comment turns out to be a duplicate.
/// \param tp is the set of properties to associate with the comment
/// \param fad is the Address of the function containing the comment
/// \param ad is the Address of the instruction associated with the comment
/// \param txt is the body of the comment
/// \return \b true if a new comment was stored, \b false if it was a duplicate
bool CommentDatabaseInternal::addCommentNoDuplicate(uint4 tp,const Address &fad,
						    const Address &ad,const string &txt)
{
  // The ordering only looks at function address, address and sub-sort index,
  // so the probe needs neither the real type nor the real text
  Comment probe(0,fad,ad,65535,"");
  CommentSet::iterator iter = commentset.lower_bound(&probe);

  int4 newUniq = 0;
  // Walk backward over the existing comments at exactly (fad,ad)
  while(iter != commentset.begin()) {
    --iter;
    const Comment *prev = *iter;
    if ((prev->getAddr() != ad) || (prev->getFuncAddr() != fad))
      break;			// Left the run of comments at this address
    if (prev->getText() == txt)
      return false;		// Matching text, don't store it
    if (newUniq == 0)
      newUniq = prev->getUniq() + 1;	// First one visited has the highest index
  }
  commentset.insert(new Comment(tp,fad,ad,newUniq,txt));
  return true;
}
/// Remove the given comment from the container and free it.
/// \param com is the comment to remove
void CommentDatabaseInternal::deleteComment(Comment *com)
{
  // Unlink before freeing: locating the entry runs the comparator on the object
  CommentSet::iterator pos = commentset.find(com);
  if (pos != commentset.end())
    commentset.erase(pos);
  delete com;
}
/// Get an iterator to the first stored comment for the given function.
/// \param fad is the Address of the function
/// \return the first comment not ordered before the minimal key for the function
CommentSet::const_iterator CommentDatabaseInternal::beginComment(const Address &fad) const
{
  // Smallest possible key within the function: minimal address, sub-sort index 0
  Comment lowestKey(0,fad,Address(Address::m_minimal),0,"");
  return commentset.lower_bound(&lowestKey);
}
/// Get an iterator marking the end of the stored comments for the given function.
/// \param fad is the Address of the function
/// \return the first comment not ordered before the maximal probe key for the function
CommentSet::const_iterator CommentDatabaseInternal::endComment(const Address &fad) const
{
  // Probe key at the maximal address with a large sub-sort index
  Comment highestKey(0,fad,Address(Address::m_maximal),65535,"");
  return commentset.lower_bound(&highestKey);
}
/// Encode all stored comments, in container order, inside a single \<commentdb> element.
/// \param encoder is the stream encoder
void CommentDatabaseInternal::encode(Encoder &encoder) const
{
  encoder.openElement(ELEM_COMMENTDB);
  CommentSet::const_iterator cur = commentset.begin();
  const CommentSet::const_iterator last = commentset.end();
  while(cur != last) {
    (*cur)->encode(encoder);
    ++cur;
  }
  encoder.closeElement(ELEM_COMMENTDB);
}
/// Parse a \<commentdb> element, adding each child comment to the container.
///
/// Each child is decoded into a temporary and then stored through addComment(),
/// so sub-sort indices are assigned by the container rather than read from the stream.
/// \param decoder is the stream decoder
void CommentDatabaseInternal::decode(Decoder &decoder)
{
  const uint4 elemId = decoder.openElement(ELEM_COMMENTDB);
  for(;;) {
    if (decoder.peekElement() == 0)
      break;			// No more child elements
    Comment parsed;
    parsed.decode(decoder);
    addComment(parsed.getType(),parsed.getFuncAddr(),parsed.getAddr(),parsed.getText());
  }
  decoder.closeElement(elemId);
}
/// Figure out position of given Comment and initialize its key.
///
/// Placement is tried in this order:
///   - a header-type comment sitting at the function's own address goes in the basic header
///   - the op at or after the comment's address, if its block contains the address
///   - the op just before that one, if its block contains the address (comment goes at block end)
///   - an op whose address matches the comment exactly, even if its block does not contain it
///   - the start of the first block, if the function has no ops at all
///   - the "unplaced" header, if unplaced comments are being displayed
///
/// A LowlevelError is thrown if one of the examined ops has no parent block.
/// \param subsort is a reference to the key to be initialized
/// \param comm is the given Comment
/// \param fd is the function owning the Comment
/// \return \b true if the Comment could be positioned at all
bool CommentSorter::findPosition(Subsort &subsort,Comment *comm,const Funcdata *fd)
{
  const uint4 props = comm->getType();
  if (props == 0) return false;
  const Address &where = comm->getAddr();

  if ((props & (Comment::header | Comment::warningheader)) != 0) {
    if (where == fd->getAddress()) {
      // Header comment at the address associated with the beginning of the function
      subsort.setHeader(header_basic);
      return true;
    }
  }

  // Try to find block containing comment
  // Start from the op at lowest address greater or equal to comment's address
  PcodeOpTree::const_iterator opiter = fd->beginOp(where);
  PcodeOp *exactOp = (PcodeOp *)0;	// Op at exactly the comment's address, kept as a fallback

  if (opiter != fd->endOpAll()) {	// There is an op at or after the comment
    PcodeOp *nextOp = opiter->second;
    BlockBasic *nextBlock = nextOp->getParent();
    if (nextBlock == (BlockBasic *)0)
      throw LowlevelError("Dead op reaching CommentSorter");
    if (nextBlock->contains(where)) {
      // The op's block contains the address, associate comment with this op
      subsort.setBlock(nextBlock->getIndex(), (uint4)nextOp->getSeqNum().getOrder());
      return true;
    }
    if (where == nextOp->getAddr())
      exactOp = nextOp;
  }

  if (opiter != fd->beginOpAll()) {	// There is a previous op
    --opiter;
    PcodeOp *prevOp = opiter->second;
    BlockBasic *prevBlock = prevOp->getParent();
    if (prevBlock == (BlockBasic *)0)
      throw LowlevelError("Dead op reaching CommentSorter");
    if (prevBlock->contains(where)) {
      // Treat the comment as being in this block at the very end
      subsort.setBlock(prevBlock->getIndex(),0xffffffff);
      return true;
    }
  }

  if (exactOp != (PcodeOp *)0) {
    // It's possible the op migrated from its original basic block.
    // Since the address matches exactly, hang the comment on it
    subsort.setBlock(exactOp->getParent()->getIndex(),(uint4)exactOp->getSeqNum().getOrder());
    return true;
  }

  if (fd->beginOpAll() == fd->endOpAll()) {	// No ops at all
    subsort.setBlock(0,0);	// Put comment at the beginning of the first block
    return true;
  }

  if (displayUnplacedComments) {
    subsort.setHeader(header_unplaced);
    return true;
  }
  return false;		// Basic block containing comment has been excised
}
/// \brief Collect and sort comments specific to the given function.
///
/// Every comment the database holds for the function is passed to findPosition().
/// Those that can be positioned are entered into the sorted map and have their
/// \e emitted flag cleared.  The property set is only tested against zero here:
/// if it is zero nothing is collected, otherwise this method applies no
/// per-comment filtering on it.
/// \param tp is the set of properties (may be zero, in which case the list stays empty)
/// \param fd is the given function
/// \param db is the container of comments to collect from
/// \param displayUnplaced is \b true if unplaced comments should be displayed in the header
void CommentSorter::setupFunctionList(uint4 tp,const Funcdata *fd,const CommentDatabase &db,bool displayUnplaced)
{
  commmap.clear();
  displayUnplacedComments = displayUnplaced;
  if (tp == 0) return;

  const Address &funcAddr( fd->getAddress() );
  // NOTE(review): begin is queried before end, as in the original; a CommentDatabase
  // implementation might depend on that call order -- confirm before reordering
  CommentSet::const_iterator cur = db.beginComment(funcAddr);
  const CommentSet::const_iterator last = db.endComment(funcAddr);

  Subsort key;
  key.pos = 0;
  for(;cur != last;++cur) {
    Comment *comm = *cur;
    if (!findPosition(key, comm, fd))
      continue;			// Comment cannot be placed, leave it out
    comm->setEmitted(false);
    commmap[ key ] = comm;
    key.pos += 1;		// Advance the uniqueness counter
  }
}
/// This will generally get called with the root p-code op of a statement
/// being emitted by the decompiler. This establishes a key value within the
/// basic block, so it is known where to stop emitting comments within the
/// block for emitting the statement.
/// \param op is the p-code representing the root of a statement
void CommentSorter::setupOpList(const PcodeOp *op)
{
if (op == (const PcodeOp *)0) { // If NULL op
opstop = stop; // pick up any remaining comments in this basic block
return;
}
Subsort subsort;
subsort.index = op->getParent()->getIndex();
subsort.order = (uint4)op->getSeqNum().getOrder();
subsort.pos = 0xffffffff;
opstop = commmap.upper_bound(subsort);
}
/// Find iterators that bound everything in the basic block
///
/// \param bl is the basic block
void CommentSorter::setupBlockList(const FlowBlock *bl)
{
Subsort subsort;
subsort.index = bl->getIndex();
subsort.order = 0;
subsort.pos = 0;
start = commmap.lower_bound(subsort);
subsort.order = 0xffffffff;
subsort.pos = 0xffffffff;
stop = commmap.upper_bound(subsort);
}
/// Header comments are grouped together. Set up iterators.
///
/// Header entries are keyed with a block index of -1 and the header type as
/// their order; \e start and \e opstop are set to bound the entries of the requested type.
/// \param headerType selects either \b header_basic or \b header_unplaced comments
void CommentSorter::setupHeader(uint4 headerType)
{
  // Smallest key for this kind of header
  Subsort first;
  first.index = -1;
  first.order = headerType;
  first.pos = 0;

  // Largest key for this kind of header
  Subsort last;
  last.index = -1;
  last.order = headerType;
  last.pos = 0xffffffff;

  start = commmap.lower_bound(first);
  opstop = commmap.upper_bound(last);
}
} // End namespace ghidra