2005-11-22 12:26:26 +00:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2000, Jesus Castagnetto <jmcastagnetto@zkey.com>
|
|
|
|
*
|
|
|
|
* This source code is released for free distribution under the terms of the
|
|
|
|
* GNU General Public License.
|
|
|
|
*
|
|
|
|
* This module contains functions for generating tags for the PHP web page
|
|
|
|
* scripting language. Only recognizes functions and classes, not methods or
|
|
|
|
* variables.
|
|
|
|
*
|
|
|
|
* Parsing PHP defines by Pavel Hlousek <pavel.hlousek@seznam.cz>, Apr 2003.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* INCLUDE FILES
|
|
|
|
*/
|
2007-07-09 15:11:18 +00:00
|
|
|
#include "general.h" /* must always come first */
|
2005-11-22 12:26:26 +00:00
|
|
|
|
|
|
|
#include <string.h>
|
2010-03-07 16:50:20 +00:00
|
|
|
#include "main.h"
|
2005-11-22 12:26:26 +00:00
|
|
|
#include "parse.h"
|
|
|
|
#include "read.h"
|
|
|
|
#include "vstring.h"
|
|
|
|
|
|
|
|
/*
|
|
|
|
* DATA DEFINITIONS
|
|
|
|
*/
|
|
|
|
typedef enum {
|
2007-07-09 15:11:18 +00:00
|
|
|
K_CLASS, K_DEFINE, K_FUNCTION, K_VARIABLE
|
2005-11-22 12:26:26 +00:00
|
|
|
} phpKind;
|
|
|
|
|
2007-11-17 19:27:50 +00:00
|
|
|
#if 0
|
2005-11-22 12:26:26 +00:00
|
|
|
static kindOption PhpKinds [] = {
|
2007-07-09 15:11:18 +00:00
|
|
|
{ TRUE, 'c', "class", "classes" },
|
2007-11-17 19:27:50 +00:00
|
|
|
{ TRUE, 'd', "define", "constant definitions" },
|
2007-07-09 15:11:18 +00:00
|
|
|
{ TRUE, 'f', "function", "functions" },
|
|
|
|
{ TRUE, 'v', "variable", "variables" }
|
2005-11-22 12:26:26 +00:00
|
|
|
};
|
2007-11-17 19:27:50 +00:00
|
|
|
#endif
|
2005-11-22 12:26:26 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* FUNCTION DEFINITIONS
|
|
|
|
*/
|
2007-11-17 19:27:50 +00:00
|
|
|
|
|
|
|
/* JavaScript patterns are duplicated in jscript.c */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Cygwin doesn't support non-ASCII characters in character classes.
|
|
|
|
* This isn't a good solution to the underlying problem, because we're still
|
|
|
|
* making assumptions about the character encoding.
|
|
|
|
* Really, these regular expressions need to concentrate on what marks the
|
|
|
|
* end of an identifier, and we need something like iconv to take into
|
|
|
|
* account the user's locale (or an override on the command-line.)
|
|
|
|
*/
|
2007-11-18 17:17:59 +00:00
|
|
|
/*
|
2007-11-17 19:27:50 +00:00
|
|
|
#ifdef __CYGWIN__
|
|
|
|
#define ALPHA "[:alpha:]"
|
|
|
|
#define ALNUM "[:alnum:]"
|
|
|
|
#else
|
|
|
|
#define ALPHA "A-Za-z\x7f-\xff"
|
|
|
|
#define ALNUM "0-9A-Za-z\x7f-\xff"
|
|
|
|
#endif
|
2007-11-18 17:17:59 +00:00
|
|
|
*/
|
2008-02-27 13:17:29 +00:00
|
|
|
/* "A-Za-z\x7f-\xff" fails on other locales than "C" and so skip it */
|
2007-11-18 17:17:59 +00:00
|
|
|
#define ALPHA "[:alpha:]"
|
|
|
|
#define ALNUM "[:alnum:]"
|
|
|
|
|
2010-03-07 16:50:20 +00:00
|
|
|
static void function_cb(const char *line, const regexMatch *matches, unsigned int count);
|
2007-11-17 19:27:50 +00:00
|
|
|
|
|
|
|
static void installPHPRegex (const langType language)
|
|
|
|
{
|
2009-09-20 19:06:48 +00:00
|
|
|
addTagRegex(language, "^[ \t]*((final|abstract)[ \t]+)*class[ \t]+([" ALPHA "_][" ALNUM "_]*)",
|
|
|
|
"\\3", "c,class,classes", NULL);
|
|
|
|
addTagRegex(language, "^[ \t]*interface[ \t]+([" ALPHA "_][" ALNUM "_]*)",
|
|
|
|
"\\1", "i,interface,interfaces", NULL);
|
|
|
|
addTagRegex(language, "^[ \t]*define[ \t]*\\([ \t]*['\"]?([" ALPHA "_][" ALNUM "_]*)",
|
2009-11-23 20:42:30 +00:00
|
|
|
"\\1", "m,macro,macros", NULL);
|
|
|
|
addTagRegex(language, "^[ \t]*const[ \t]*([" ALPHA "_][" ALNUM "_]*)[ \t]*[=;]",
|
|
|
|
"\\1", "m,macro,macros", NULL);
|
2010-03-07 16:50:20 +00:00
|
|
|
addCallbackRegex(language,
|
2012-01-01 17:01:49 +00:00
|
|
|
"^[ \t]*((public|protected|private|static|final)[ \t]+)*function[ \t]+&?[ \t]*([" ALPHA "_][" ALNUM "_]*)[[:space:]]*(\\(.*\\)|\\(.*)",
|
2010-11-18 18:20:12 +00:00
|
|
|
NULL, function_cb);
|
2009-09-20 19:06:48 +00:00
|
|
|
addTagRegex(language, "^[ \t]*(\\$|::\\$|\\$this->)([" ALPHA "_][" ALNUM "_]*)[ \t]*=",
|
|
|
|
"\\2", "v,variable,variables", NULL);
|
|
|
|
addTagRegex(language, "^[ \t]*((var|public|protected|private|static)[ \t]+)+\\$([" ALPHA "_][" ALNUM "_]*)[ \t]*[=;]",
|
2007-11-17 19:27:50 +00:00
|
|
|
"\\3", "v,variable,variables", NULL);
|
|
|
|
|
|
|
|
/* function regex is covered by PHP regex */
|
|
|
|
addTagRegex (language, "(^|[ \t])([A-Za-z0-9_]+)[ \t]*[=:][ \t]*function[ \t]*\\(",
|
|
|
|
"\\2", "j,jsfunction,javascript functions", NULL);
|
|
|
|
addTagRegex (language, "(^|[ \t])([A-Za-z0-9_.]+)\\.([A-Za-z0-9_]+)[ \t]*=[ \t]*function[ \t]*\\(",
|
|
|
|
"\\2.\\3", "j,jsfunction,javascript functions", NULL);
|
|
|
|
addTagRegex (language, "(^|[ \t])([A-Za-z0-9_.]+)\\.([A-Za-z0-9_]+)[ \t]*=[ \t]*function[ \t]*\\(",
|
|
|
|
"\\3", "j,jsfunction,javascript functions", NULL);
|
|
|
|
}
|
|
|
|
|
2010-03-07 16:50:20 +00:00
|
|
|
|
|
|
|
static void function_cb(const char *line, const regexMatch *matches, unsigned int count)
|
|
|
|
{
|
|
|
|
char *name, *arglist;
|
2010-04-17 16:12:22 +00:00
|
|
|
char kind = 'f';
|
2011-06-17 22:52:43 +00:00
|
|
|
static const char *kindName = "function";
|
2010-03-07 16:50:20 +00:00
|
|
|
tagEntryInfo e;
|
|
|
|
const regexMatch *match_funcname = NULL;
|
|
|
|
const regexMatch *match_arglist = NULL;
|
|
|
|
|
2010-04-17 16:12:22 +00:00
|
|
|
if (count > 2)
|
2010-03-07 16:50:20 +00:00
|
|
|
{
|
|
|
|
match_funcname = &matches[count - 2];
|
2010-04-17 16:12:22 +00:00
|
|
|
match_arglist = &matches[count - 1];
|
2010-03-07 16:50:20 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (match_funcname != NULL)
|
|
|
|
{
|
|
|
|
name = xMalloc(match_funcname->length + 1, char);
|
|
|
|
strncpy(name, line + match_funcname->start, match_funcname->length);
|
|
|
|
*(name+match_funcname->length) = '\x0';
|
|
|
|
arglist = xMalloc(match_arglist->length + 1, char);
|
|
|
|
strncpy(arglist, line + match_arglist->start, match_arglist->length);
|
|
|
|
*(arglist+match_arglist->length) = '\x0';
|
|
|
|
|
|
|
|
initTagEntry (&e, name);
|
2010-04-17 16:12:22 +00:00
|
|
|
e.kind = kind;
|
2010-03-07 16:50:20 +00:00
|
|
|
e.kindName = kindName;
|
|
|
|
e.extensionFields.arglist = arglist;
|
|
|
|
makeTagEntry (&e);
|
2011-02-06 16:03:27 +00:00
|
|
|
|
|
|
|
eFree(name);
|
|
|
|
eFree(arglist);
|
2010-03-07 16:50:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2007-11-17 19:27:50 +00:00
|
|
|
/* Create parser definition structure */
|
|
|
|
extern parserDefinition* PhpParser (void)
|
|
|
|
{
|
|
|
|
static const char *const extensions [] = { "php", "php3", "phtml", NULL };
|
|
|
|
parserDefinition* def = parserNew ("PHP");
|
|
|
|
def->extensions = extensions;
|
|
|
|
def->initialize = installPHPRegex;
|
|
|
|
def->regex = TRUE;
|
|
|
|
return def;
|
|
|
|
}
|
|
|
|
|
|
|
|
#if 0
|
|
|
|
|
2005-11-22 12:26:26 +00:00
|
|
|
static boolean isLetter(const int c)
|
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
return (boolean)(isalpha(c) || (c >= 127 && c <= 255));
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static boolean isVarChar1(const int c)
|
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
return (boolean)(isLetter (c) || c == '_');
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static boolean isVarChar(const int c)
|
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
return (boolean)(isVarChar1 (c) || isdigit (c));
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static void findPhpTags (void)
|
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
vString *name = vStringNew ();
|
|
|
|
const unsigned char *line;
|
2005-11-22 12:26:26 +00:00
|
|
|
|
2007-07-09 15:11:18 +00:00
|
|
|
while ((line = fileReadLine ()) != NULL)
|
2005-11-22 12:26:26 +00:00
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
const unsigned char *cp = line;
|
|
|
|
const char* f;
|
|
|
|
|
|
|
|
while (isspace (*cp))
|
|
|
|
cp++;
|
|
|
|
|
|
|
|
if (*(const char*)cp == '$' && isVarChar1 (*(const char*)(cp+1)))
|
|
|
|
{
|
|
|
|
cp += 1;
|
|
|
|
vStringClear (name);
|
|
|
|
while (isVarChar ((int) *cp))
|
|
|
|
{
|
|
|
|
vStringPut (name, (int) *cp);
|
|
|
|
++cp;
|
|
|
|
}
|
|
|
|
while (isspace ((int) *cp))
|
|
|
|
++cp;
|
|
|
|
if (*(const char*) cp == '=')
|
|
|
|
{
|
|
|
|
vStringTerminate (name);
|
|
|
|
makeSimpleTag (name, PhpKinds, K_VARIABLE);
|
|
|
|
vStringClear (name);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if ((f = strstr ((const char*) cp, "function")) != NULL &&
|
|
|
|
(f == (const char*) cp || isspace ((int) f [-1])) &&
|
|
|
|
isspace ((int) f [8]))
|
|
|
|
{
|
|
|
|
cp = ((const unsigned char *) f) + 8;
|
|
|
|
|
|
|
|
while (isspace ((int) *cp))
|
|
|
|
++cp;
|
|
|
|
|
|
|
|
if (*cp == '&') /* skip reference character and following whitespace */
|
|
|
|
{
|
|
|
|
cp++;
|
|
|
|
|
|
|
|
while (isspace ((int) *cp))
|
2007-11-18 17:17:59 +00:00
|
|
|
++cp;
|
2007-07-09 15:11:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
vStringClear (name);
|
|
|
|
while (isalnum ((int) *cp) || *cp == '_')
|
|
|
|
{
|
|
|
|
vStringPut (name, (int) *cp);
|
|
|
|
++cp;
|
|
|
|
}
|
|
|
|
vStringTerminate (name);
|
|
|
|
makeSimpleTag (name, PhpKinds, K_FUNCTION);
|
|
|
|
vStringClear (name);
|
2007-11-18 17:17:59 +00:00
|
|
|
}
|
2007-11-17 19:27:50 +00:00
|
|
|
else if (strncmp ((const char*) cp, "class", (size_t) 5) == 0 &&
|
|
|
|
isspace ((int) cp [5]))
|
2007-07-09 15:11:18 +00:00
|
|
|
{
|
2007-11-17 19:27:50 +00:00
|
|
|
cp += 5;
|
2007-07-09 15:11:18 +00:00
|
|
|
|
|
|
|
while (isspace ((int) *cp))
|
|
|
|
++cp;
|
|
|
|
vStringClear (name);
|
|
|
|
while (isalnum ((int) *cp) || *cp == '_')
|
|
|
|
{
|
|
|
|
vStringPut (name, (int) *cp);
|
|
|
|
++cp;
|
|
|
|
}
|
|
|
|
vStringTerminate (name);
|
|
|
|
makeSimpleTag (name, PhpKinds, K_CLASS);
|
|
|
|
vStringClear (name);
|
|
|
|
}
|
|
|
|
else if (strncmp ((const char*) cp, "define", (size_t) 6) == 0 &&
|
|
|
|
! isalnum ((int) cp [6]))
|
|
|
|
{
|
|
|
|
cp += 6;
|
|
|
|
|
|
|
|
while (isspace ((int) *cp))
|
|
|
|
++cp;
|
|
|
|
if (*cp != '(')
|
|
|
|
continue;
|
|
|
|
++cp;
|
|
|
|
|
|
|
|
while (isspace ((int) *cp))
|
|
|
|
++cp;
|
|
|
|
if ((*cp == '\'') || (*cp == '"'))
|
|
|
|
++cp;
|
|
|
|
else if (! ((*cp == '_') || isalnum ((int) *cp)))
|
|
|
|
continue;
|
2007-11-18 17:17:59 +00:00
|
|
|
|
2007-07-09 15:11:18 +00:00
|
|
|
vStringClear (name);
|
|
|
|
while (isalnum ((int) *cp) || *cp == '_')
|
|
|
|
{
|
|
|
|
vStringPut (name, (int) *cp);
|
|
|
|
++cp;
|
|
|
|
}
|
|
|
|
vStringTerminate (name);
|
|
|
|
makeSimpleTag (name, PhpKinds, K_DEFINE);
|
|
|
|
vStringClear (name);
|
|
|
|
}
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
2007-07-09 15:11:18 +00:00
|
|
|
vStringDelete (name);
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
extern parserDefinition* PhpParser (void)
|
|
|
|
{
|
2007-07-09 15:11:18 +00:00
|
|
|
static const char *const extensions [] = { "php", "php3", "phtml", NULL };
|
|
|
|
parserDefinition* def = parserNew ("PHP");
|
|
|
|
def->kinds = PhpKinds;
|
|
|
|
def->kindCount = KIND_COUNT (PhpKinds);
|
|
|
|
def->extensions = extensions;
|
|
|
|
def->parser = findPhpTags;
|
|
|
|
return def;
|
2005-11-22 12:26:26 +00:00
|
|
|
}
|
|
|
|
|
2007-11-17 19:27:50 +00:00
|
|
|
#endif
|
2007-07-09 15:11:18 +00:00
|
|
|
|
|
|
|
/* vi:set tabstop=4 shiftwidth=4: */
|