//===--- RewriteTest.cpp - Playground for the code rewriter ---------------===// // // The LLVM Compiler Infrastructure // // This file was developed by Chris Lattner and is distributed under the // University of Illinois Open Source License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // Hacks and fun related to the code rewriter. // //===----------------------------------------------------------------------===// #include "ASTConsumers.h" #include "clang/Rewrite/Rewriter.h" #include "clang/AST/AST.h" #include "clang/AST/ASTConsumer.h" #include "clang/Basic/SourceManager.h" using namespace clang; namespace { class RewriteTest : public ASTConsumer { Rewriter Rewrite; ASTContext *Context; SourceManager *SM; unsigned MainFileID; SourceLocation LastIncLoc; llvm::SmallVector ClassImplementation; llvm::SmallVector CategoryImplementation; static const int OBJC_ABI_VERSION =7 ; public: void Initialize(ASTContext &context, unsigned mainFileID) { Context = &context; SM = &Context->SourceMgr; MainFileID = mainFileID; Rewrite.setSourceMgr(Context->SourceMgr); } virtual void HandleTopLevelDecl(Decl *D); void HandleDeclInMainFile(Decl *D); void RewriteInclude(SourceLocation Loc); void RewriteFunctionBody(Stmt *S); void RewriteAtEncode(ObjCEncodeExpr *Exp); void WriteObjcClassMetaData(ObjcImplementationDecl *IDecl); void WriteObjcMetaData(); ~RewriteTest(); }; } ASTConsumer *clang::CreateCodeRewriterTest() { return new RewriteTest(); } void RewriteTest::HandleTopLevelDecl(Decl *D) { // Two cases: either the decl could be in the main file, or it could be in a // #included file. If the former, rewrite it now. If the later, check to see // if we rewrote the #include/#import. SourceLocation Loc = D->getLocation(); Loc = SM->getLogicalLoc(Loc); // If this is for a builtin, ignore it. if (Loc.isInvalid()) return; if (SM->getDecomposedFileLoc(Loc).first == MainFileID) return HandleDeclInMainFile(D); RewriteInclude(Loc); } void RewriteTest::RewriteInclude(SourceLocation Loc) { // Rip up the #include stack to the main file. SourceLocation IncLoc = Loc, NextLoc = Loc; do { IncLoc = Loc; Loc = SM->getLogicalLoc(NextLoc); NextLoc = SM->getIncludeLoc(Loc); } while (!NextLoc.isInvalid()); // Loc is now the location of the #include filename "foo" or . // IncLoc indicates the header that was included if it is useful. IncLoc = SM->getLogicalLoc(IncLoc); if (SM->getDecomposedFileLoc(Loc).first != MainFileID || Loc == LastIncLoc) return; LastIncLoc = Loc; unsigned IncCol = SM->getColumnNumber(Loc); SourceLocation LineStartLoc = Loc.getFileLocWithOffset(-IncCol+1); // Replace the #import with #include. Rewrite.ReplaceText(LineStartLoc, IncCol-1, "#include ", strlen("#include ")); } /// HandleDeclInMainFile - This is called for each top-level decl defined in the /// main file of the input. void RewriteTest::HandleDeclInMainFile(Decl *D) { if (FunctionDecl *FD = dyn_cast(D)) if (Stmt *Body = FD->getBody()) RewriteFunctionBody(Body); if (ObjcImplementationDecl *CI = dyn_cast(D)) ClassImplementation.push_back(CI); else if (ObjcCategoryImplDecl *CI = dyn_cast(D)) CategoryImplementation.push_back(CI); // Nothing yet. } void RewriteTest::RewriteFunctionBody(Stmt *S) { // Handle specific things. if (ObjCEncodeExpr *AtEncode = dyn_cast(S)) return RewriteAtEncode(AtEncode); // Otherwise, just rewrite all children. for (Stmt::child_iterator CI = S->child_begin(), E = S->child_end(); CI != E; ++CI) if (*CI) RewriteFunctionBody(*CI); } void RewriteTest::RewriteAtEncode(ObjCEncodeExpr *Exp) { // Create a new string expression. QualType StrType = Context->getPointerType(Context->CharTy); Expr *Replacement = new StringLiteral("foo", 3, false, StrType, SourceLocation(), SourceLocation()); Rewrite.ReplaceStmt(Exp, Replacement); delete Replacement; } void RewriteTest::WriteObjcClassMetaData(ObjcImplementationDecl *IDecl) { ObjcInterfaceDecl *CDecl = IDecl->getClassInterface(); // Build _objc_ivar_list metadata for classes ivars if needed if (IDecl->getImplDeclNumIvars() > 0 || CDecl&& CDecl->getIntfDeclNumIvars() > 0) { static bool objc_ivar = false; int NumIvars = IDecl->getImplDeclNumIvars() > 0 ? IDecl->getImplDeclNumIvars() : CDecl->getIntfDeclNumIvars(); if (!objc_ivar) { /* struct _objc_ivar { char *ivar_name; char *ivar_type; int ivar_offset; }; */ printf("\nstruct _objc_ivar {\n"); printf("\tchar *ivar_name;\n"); printf("\tchar *ivar_type;\n"); printf("\tint ivar_offset;\n"); printf("};\n"); objc_ivar = true; } /* struct _objc_ivar_list { int ivar_count; struct _objc_ivar ivar_list[ivar_count]; }; */ printf("\nstatic struct {\n"); printf("\tint ivar_count;\n"); printf("\tstruct _objc_ivar ivar_list[%d];\n", NumIvars); printf("} _OBJC_INSTANCE_VARIABLES_%s " "__attribute__ ((section (\"__OBJC, __instance_vars\")))= " "{\n\t%d\n",IDecl->getName(), NumIvars); ObjcIvarDecl **Ivars = IDecl->getImplDeclIVars() ? IDecl->getImplDeclIVars() : CDecl->getIntfDeclIvars(); for (int i = 0; i < NumIvars; i++) // TODO: 1) ivar names may have to go to another section. 2) encode // ivar_type type of each ivar . 3) compute and add ivar offset. printf("\t,\"%s\", \"\", 0\n", Ivars[i]->getName()); printf("};\n"); } // Build _objc_method for class's instance or class methods metadata if needed static bool objc_impl_method = false; if (IDecl->getNumInstanceMethods() > 0 || IDecl->getNumClassMethods() > 0) { if (!objc_impl_method) { /* struct _objc_method { SEL _cmd; char *method_types; void *_imp; } */ printf("\nstruct _objc_method {\n"); printf("\tSEL _cmd;\n"); printf("\tchar *method_types;\n"); printf("\tvoid *_imp;\n"); printf("};\n"); objc_impl_method = true; } } // Build _objc_method_list for class's instance methods if needed if (IDecl->getNumInstanceMethods() > 0) { int NumMethods = IDecl->getNumInstanceMethods(); /* struct _objc_method_list { struct objc_method_list *next_method; int method_count; struct _objc_method method_list[method_count]; } */ printf("\nstatic struct {\n"); printf("\tstruct objc_method_list *next_method;\n"); printf("\tint method_count;\n"); printf("\tstruct _objc_method method_list[%d];\n", NumMethods); printf("} _OBJC_INSTANCE_METHODS_%s " "__attribute__ ((section (\"__OBJC, __inst_meth\")))= " "{\n\t0, %d\n", IDecl->getName(), NumMethods); ObjcMethodDecl **Methods = IDecl->getInstanceMethods(); for (int i = 0; i < NumMethods; i++) // TODO: 1) method selector name may hav to go into their own section // 2) encode method types for use here (which may have to go into // __meth_var_types section, 3) Need method address as 3rd initializer. printf("\t,(SEL)\"%s\", \"\", 0\n", Methods[i]->getSelector().getName().c_str()); printf("};\n"); } // Build _objc_method_list for class's class methods if needed if (IDecl->getNumClassMethods() > 0) { int NumMethods = IDecl->getNumClassMethods(); /* struct _objc_method_list { struct objc_method_list *next_method; int method_count; struct _objc_method method_list[method_count]; } */ printf("\nstatic struct {\n"); printf("\tstruct objc_method_list *next_method;\n"); printf("\tint method_count;\n"); printf("\tstruct _objc_method method_list[%d];\n", NumMethods); printf("} _OBJC_CLASS_METHODS_%s " "__attribute__ ((section (\"__OBJC, __cls_meth\")))= " "{\n\t0, %d\n", IDecl->getName(), NumMethods); ObjcMethodDecl **Methods = IDecl->getClassMethods(); for (int i = 0; i < NumMethods; i++) // TODO: 1) method selector name may hav to go into their own section // 2) encode method types for use here (which may have to go into // __meth_var_types section, 3) Need method address as 3rd initializer. printf("\t,(SEL)\"%s\", \"\", 0\n", Methods[i]->getSelector().getName().c_str()); printf("};\n"); } // Protocols referenced in class declaration? static bool objc_protocol_methods = false; int NumProtocols = CDecl->getNumIntfRefProtocols(); if (NumProtocols > 0) { ObjcProtocolDecl **Protocols = CDecl->getReferencedProtocols(); for (int i = 0; i < NumProtocols; i++) { ObjcProtocolDecl *PDecl = Protocols[i]; // Output struct protocol_methods holder of method selector and type. if (!objc_protocol_methods && (PDecl->getNumInstanceMethods() > 0 || PDecl->getNumClassMethods() > 0)) { /* struct protocol_methods { SEL _cmd; char *method_types; } */ printf("\nstruct protocol_methods {\n"); printf("\tSEL _cmd;\n"); printf("\tchar *method_types;\n"); printf("};\n"); objc_protocol_methods = true; } // Output instance methods declared in this protocol. /* struct _objc_protocol_method_list { int protocol_method_count; struct protocol_methods protocols[protocol_method_count]; } */ int NumMethods = PDecl->getNumInstanceMethods(); if (NumMethods > 0) { printf("\nstatic struct {\n"); printf("\tint protocol_method_count;\n"); printf("\tstruct protocol_methods protocols[%d];\n", NumMethods); printf("} _OBJC_PROTOCOL_INSTANCE_METHODS_%s " "__attribute__ ((section (\"__OBJC, __cat_inst_meth\")))= " "{\n\t%d\n",PDecl->getName(), NumMethods); ObjcMethodDecl **Methods = PDecl->getInstanceMethods(); for (int i = 0; i < NumMethods; i++) // TODO: 1) method selector name may hav to go into their own section // 2) encode method types for use here (which may have to go into // __meth_var_types section. printf("\t,(SEL)\"%s\", \"\"\n", Methods[i]->getSelector().getName().c_str()); printf("};\n"); } // Output class methods declared in this protocol. NumMethods = PDecl->getNumClassMethods(); if (NumMethods > 0) { printf("\nstatic struct {\n"); printf("\tint protocol_method_count;\n"); printf("\tstruct protocol_methods protocols[%d];\n", NumMethods); printf("} _OBJC_PROTOCOL_CLASS_METHODS_%s " "__attribute__ ((section (\"__OBJC, __cat_cls_meth\")))= " "{\n\t%d\n",PDecl->getName(), NumMethods); ObjcMethodDecl **Methods = PDecl->getClassMethods(); for (int i = 0; i < NumMethods; i++) // TODO: 1) method selector name may hav to go into their own section // 2) encode method types for use here (which may have to go into // __meth_var_types section. printf("\t,(SEL)\"%s\", \"\"\n", Methods[i]->getSelector().getName().c_str()); printf("};\n"); } // Output: /* struct _objc_protocol { // Objective-C 1.0 extensions struct _objc_protocol_extension *isa; char *protocol_name; struct _objc_protocol **protocol_list; struct _objc__method_prototype_list *instance_methods; struct _objc__method_prototype_list *class_methods; }; */ static bool objc_protocol = false; if (!objc_protocol) { printf("\nstruct _objc_protocol {\n"); printf("\tstruct _objc_protocol_extension *isa;\n"); printf("\tchar *protocol_name;\n"); printf("\tstruct _objc_protocol **protocol_list;\n"); printf("\tstruct _objc__method_prototype_list *instance_methods;\n"); printf("\tstruct _objc__method_prototype_list *class_methods;\n"); printf("};\n"); objc_protocol = true; } printf("\nstatic struct _objc_protocol _OBJC_PROTOCOL_%s " "__attribute__ ((section (\"__OBJC, __protocol\")))= " "{\n\t0, \"%s\", 0, ", PDecl->getName(), PDecl->getName()); if (PDecl->getInstanceMethods() > 0) printf("(struct _objc__method_prototype_list *)" "&_OBJC_PROTOCOL_INSTANCE_METHODS_%s, ", PDecl->getName()); else printf("0, "); if (PDecl->getClassMethods() > 0) printf("(struct _objc__method_prototype_list *)" "&_OBJC_PROTOCOL_CLASS_METHODS_%s\n", PDecl->getName()); else printf("0\n"); printf("};\n"); } } if (NumProtocols > 0) { // Output the top lovel protocol meta-data for the class. /* struct _objc_protocol_list { struct _objc_protocol_list *next; int protocol_count; struct _objc_protocol *class_protocols[protocol_count]; } */ printf("\nstatic struct {\n"); printf("\tstruct _objc_protocol_list *next;\n"); printf("\tint protocol_count;\n"); printf("\tstruct _objc_protocol *class_protocols[%d];\n" "} _OBJC_CLASS_PROTOCOLS_%s " "__attribute__ ((section (\"__OBJC, __cat_cls_meth\")))= " "{\n\t0, %d\n",NumProtocols, CDecl->getName(), NumProtocols); ObjcProtocolDecl **Protocols = CDecl->getReferencedProtocols(); for (int i = 0; i < NumProtocols; i++) { ObjcProtocolDecl *PDecl = Protocols[i]; printf("\t,&_OBJC_PROTOCOL_%s \n", PDecl->getName()); } printf("};\n"); } // Declaration of top-level metadata /* struct _objc_meta_class { const char *root_class_name; const char *super_class_name; char *name; long version; long info; long instance_size; struct objc_ivar_list *ivars; struct objc_method_list *methods; struct objc_cache *cache; struct objc_protocol_list *protocols; const char *ivar_layout; struct _objc_class_ext *ext; }; */ static bool objc_meta_class = false; if (!objc_meta_class) { printf("\nstruct _objc_class {\n"); printf("\tconst char *root_class_name;\n"); printf("\tconst char *super_class_name;\n"); printf("\tchar *name;\n"); printf("\tlong version;\n"); printf("\tlong info;\n"); printf("\tlong instance_size;\n"); printf("\tstruct objc_ivar_list *ivars;\n"); printf("\tstruct objc_method_list *methods;\n"); printf("\tstruct objc_cache *cache;\n"); printf("\tstruct objc_protocol_list *protocols;\n"); printf("\tconst char *ivar_layout;\n"); printf("\tstruct _objc_class_ext *ext;\n"); printf("};\n"); objc_meta_class = true; } // Meta-class metadata generation. ObjcInterfaceDecl *RootClass = 0; ObjcInterfaceDecl *SuperClass = CDecl->getSuperClass(); while (SuperClass) { RootClass = SuperClass; SuperClass = SuperClass->getSuperClass(); } SuperClass = CDecl->getSuperClass(); printf("\nstatic struct _objc_class _OBJC_METACLASS_%s " "__attribute__ ((section (\"__OBJC, __meta_class\")))= " "{\n\t\"%s\"", CDecl->getName(), RootClass ? RootClass->getName() : CDecl->getName()); if (SuperClass) printf(", \"%s\", \"%s\"", SuperClass->getName(), CDecl->getName()); else printf(", 0, \"%s\"", CDecl->getName()); // FIXME: better way of getting size struct _objc_class (48) // TODO: 'ivars' field for root class is currently set to 0. // 'info' field is initialized to CLS_META(2) for metaclass printf(", 0,2,48,0"); if (CDecl->getNumClassMethods() > 0) printf(", (struct objc_method_list *)&_OBJC_CLASS_METHODS_%s\n", CDecl->getName()); else printf(", 0\n"); printf("\t,0,0,0,0\n"); printf("};\n"); } void RewriteTest::WriteObjcMetaData() { int ClsDefCount = ClassImplementation.size(); int CatDefCount = CategoryImplementation.size(); if (ClsDefCount == 0 && CatDefCount == 0) return; // For each defined class, write out all its meta data. for (int i = 0; i < ClsDefCount; i++) WriteObjcClassMetaData(ClassImplementation[i]); // Write objc_symtab metadata /* struct _objc_symtab { long sel_ref_cnt; SEL *refs; short cls_def_cnt; short cat_def_cnt; void *defs[cls_def_cnt + cat_def_cnt]; }; */ printf("\nstruct _objc_symtab {\n"); printf("\tlong sel_ref_cnt;\n"); printf("\tSEL *refs;\n"); printf("\tshort cls_def_cnt;\n"); printf("\tshort cat_def_cnt;\n"); printf("\tvoid *defs[%d];\n", ClsDefCount + CatDefCount); printf("};\n\n"); printf("static struct _objc_symtab " "_OBJC_SYMBOLS __attribute__ ((section (\"__OBJC, __symbols\")))= {\n"); printf("\t0, 0, %d, %d\n", ClsDefCount, CatDefCount); for (int i = 0; i < ClsDefCount; i++) printf("\t,_OBJC_CLASS_%s\n", ClassImplementation[i]->getName()); for (int i = 0; i < CatDefCount; i++) printf("\t,_OBJC_CATEGORY_%s_%s\n", CategoryImplementation[i]->getClassInterface()->getName(), CategoryImplementation[i]->getName()); printf("};\n\n"); // Write objc_module metadata /* struct _objc_module { long version; long size; const char *name; struct _objc_symtab *symtab; } */ printf("\nstruct _objc_module {\n"); printf("\tlong version;\n"); printf("\tlong size;\n"); printf("\tconst char *name;\n"); printf("\tstruct _objc_symtab *symtab;"); printf("};\n\n"); printf("static struct _objc_module " "_OBJC_MODULES __attribute__ ((section (\"__OBJC, __module_info\")))= {\n"); printf("\t%d, %d, \"\", &_OBJC_SYMBOLS\n", OBJC_ABI_VERSION, 16); printf("};\n\n"); } RewriteTest::~RewriteTest() { // Get the top-level buffer that this corresponds to. std::pair MainBuf = SM->getBufferData(MainFileID); const char *MainBufStart = MainBuf.first; const char *MainBufEnd = MainBuf.second; // Loop over the whole file, looking for tabs. for (const char *BufPtr = MainBufStart; BufPtr != MainBufEnd; ++BufPtr) { if (*BufPtr != '\t') continue; // Okay, we found a tab. This tab will turn into at least one character, // but it depends on which 'virtual column' it is in. Compute that now. unsigned VCol = 0; while (BufPtr-VCol != MainBufStart && BufPtr[-VCol-1] != '\t' && BufPtr[-VCol-1] != '\n' && BufPtr[-VCol-1] != '\r') ++VCol; // Okay, now that we know the virtual column, we know how many spaces to // insert. We assume 8-character tab-stops. unsigned Spaces = 8-(VCol & 7); // Get the location of the tab. SourceLocation TabLoc = SourceLocation::getFileLoc(MainFileID, BufPtr-MainBufStart); // Rewrite the single tab character into a sequence of spaces. Rewrite.ReplaceText(TabLoc, 1, " ", Spaces); } // Get the buffer corresponding to MainFileID. If we haven't changed it, then // we are done. if (const RewriteBuffer *RewriteBuf = Rewrite.getRewriteBufferFor(MainFileID)) { printf("Changed:\n"); std::string S(RewriteBuf->begin(), RewriteBuf->end()); printf("%s\n", S.c_str()); } else { printf("No changes\n"); } // Rewrite Objective-c meta data* WriteObjcMetaData(); }