forked from universal-ctags/ctags
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
FrontMatter: new subparser parser run from Markdown parser
In this version, just extracting "foo" in "title: foo" written in Yaml. JSON(;;;) and TOML(+++) are not supported yet. Close universal-ctags#3032. Signed-off-by: Masatake YAMATO <[email protected]>
- Loading branch information
Showing
9 changed files
with
336 additions
and
12 deletions.
There are no files selected for viewing
23 changes: 12 additions & 11 deletions
23
Units/parser-rmarkdown.r/simple-rmarkdown.d/expected.tags
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,11 +1,12 @@ | ||
S1 input.rmd /^# S1$/;" chapter line:1 language:Markdown end:14 | ||
xyX input.rmd /^```{r xyX}$/;" chunklabel line:3 language:RMarkdown extras:subparser | ||
S2 input.rmd /^# S2$/;" chapter line:15 language:Markdown end:25 | ||
__anon4a45a9700100 input.rmd /^```{r, cache = TRUE, dependson = "xyX"}$/;" chunklabel line:17 language:RMarkdown extras:subparser,anonymous | ||
__anon4a45a9700200 input.rmd /^```{python}$/;" chunklabel line:21 language:RMarkdown extras:subparser,anonymous | ||
S3 input.rmd /^# S3$/;" chapter line:26 language:Markdown end:27 | ||
x input.rmd /^x <- 1$/;" globalVar line:5 language:R extras:guest end:5 | ||
foo input.rmd /^foo <- function () {$/;" function line:6 language:R extras:guest end:9 | ||
y input.rmd /^ y <- 2$/;" functionVar line:7 language:R function:foo extras:guest end:7 | ||
X input.rmd /^X <- func()$/;" globalVar line:11 language:R extras:guest end:11 | ||
f input.rmd /^def f():$/;" function line:22 language:Python extras:guest end:24 | ||
S1 input.rmd /^# S1$/;" chapter line:4 language:Markdown end:17 | ||
xyX input.rmd /^```{r xyX}$/;" chunklabel line:6 language:RMarkdown extras:subparser | ||
S2 input.rmd /^# S2$/;" chapter line:18 language:Markdown end:28 | ||
__anon4a45a9700100 input.rmd /^```{r, cache = TRUE, dependson = "xyX"}$/;" chunklabel line:20 language:RMarkdown extras:subparser,anonymous | ||
__anon4a45a9700200 input.rmd /^```{python}$/;" chunklabel line:24 language:RMarkdown extras:subparser,anonymous | ||
S3 input.rmd /^# S3$/;" chapter line:29 language:Markdown end:30 | ||
x input.rmd /^x <- 1$/;" globalVar line:8 language:R extras:guest end:8 | ||
foo input.rmd /^foo <- function () {$/;" function line:9 language:R extras:guest end:12 | ||
y input.rmd /^ y <- 2$/;" functionVar line:10 language:R function:foo extras:guest end:10 | ||
X input.rmd /^X <- func()$/;" globalVar line:14 language:R extras:guest end:14 | ||
f input.rmd /^def f():$/;" function line:25 language:Python extras:guest end:27 | ||
example for u-ctags input.rmd /^title: example for u-ctags$/;" title line:2 language:FrontMatter extras:subparser |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,3 +1,6 @@ | ||
--- | ||
title: example for u-ctags | ||
--- | ||
# S1 | ||
|
||
```{r xyX} | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,89 @@ | ||
/* | ||
* | ||
* Copyright (c) 2022, Masatake YAMATO | ||
* Copyright (c) 2022, Red Hat, K.K. | ||
* | ||
* This source code is released for free distribution under the terms of the | ||
* GNU General Public License version 2 or (at your option) any later version. | ||
* | ||
* This module contains functions for extracting language objects in FrontMatter. | ||
* | ||
* https://gohugo.io/content-management/front-matter | ||
*/ | ||
|
||
/* | ||
* INCLUDE FILES | ||
*/ | ||
#include "general.h" /* must always come first */ | ||
|
||
#include "frontmatter.h" | ||
|
||
#include "entry.h" | ||
#include "parse.h" | ||
#include "promise.h" | ||
#include "read.h" | ||
|
||
#include <string.h> | ||
|
||
/* | ||
* DATA DEFINITIONS | ||
*/ | ||
static kindDefinition FrontMatterKinds [] = { | ||
{ true, 't', "title", "titles", }, | ||
}; | ||
|
||
/* | ||
* FUNCTION DEFINITIONS | ||
*/ | ||
static void findFrontMatterTags (void) | ||
{ | ||
const unsigned char *line = readLineFromInputFile (); | ||
|
||
if (line == NULL) | ||
return; | ||
|
||
#ifdef HAVE_LIBYAML | ||
if (strcmp("---", (const char *)line) == 0) | ||
{ | ||
line = readLineFromInputFile (); | ||
unsigned long endOffset = strlen((const char *)line); | ||
if (line) | ||
{ | ||
long startLineNum = getInputLineNumber (); | ||
while ((line = readLineFromInputFile())) | ||
endOffset = strlen((const char *)line); | ||
|
||
long endLineNum = getInputLineNumber (); | ||
|
||
makePromise ("YamlFrontMatter", startLineNum, 0, | ||
endLineNum, endOffset, startLineNum); | ||
} | ||
return; | ||
} | ||
#endif | ||
} | ||
|
||
extern parserDefinition* FrontMatterParser (void) | ||
{ | ||
parserDefinition* def = parserNew ("FrontMatter"); | ||
def->kindTable = FrontMatterKinds; | ||
def->kindCount = ARRAY_SIZE (FrontMatterKinds); | ||
|
||
def->parser = findFrontMatterTags; | ||
|
||
/* | ||
* This setting (useMemoryStreamInput) is for running | ||
* Yaml parser from YamlFrontMatter as subparser. | ||
* YamlFrontMatter is run from FrontMatter as a gust parser. | ||
* FrontMatter is run from Markdown as a guest parser. | ||
* This stacked structure hits the limitation of the main | ||
* part: subparser's requirement for memory based input stream | ||
* is not propagated to the main part. | ||
* | ||
* TODO: instead of setting useMemoryStreamInput here, we | ||
* should remove the limitation. | ||
*/ | ||
def->useMemoryStreamInput = true; | ||
|
||
return def; | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,19 @@ | ||
/* | ||
* Copyright (c) 2022, Masatake YAMATO <[email protected]> | ||
* | ||
* This source code is released for free distribution under the terms of the | ||
* GNU General Public License version 2 or (at your option) any later version. | ||
* | ||
* Frontmatter parser interface exported to the other parsers | ||
*/ | ||
|
||
#ifndef CTAGS_FRONTMATTER_H | ||
#define CTAGS_FRONTMATTER_H | ||
|
||
#include "general.h" | ||
|
||
typedef enum { | ||
FRONTMATTER_TITLE_KIND, | ||
} frontmatterKind; | ||
|
||
#endif |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,194 @@ | ||
/* | ||
* | ||
* Copyright (c) 2022, Masatake YAMATO | ||
* Copyright (c) 2022, Red Hat, K.K. | ||
* | ||
* This source code is released for free distribution under the terms of the | ||
* GNU General Public License version 2 or (at your option) any later version. | ||
* | ||
* This module contains functions for extracting language objects in FrontMatter | ||
* using Yaml. | ||
* | ||
* https://gohugo.io/content-management/front-matter | ||
*/ | ||
|
||
/* | ||
* INCLUDE FILES | ||
*/ | ||
#include "general.h" /* must always come first */ | ||
|
||
#include "frontmatter.h" | ||
#include "yaml.h" | ||
|
||
#include "entry.h" | ||
#include "gcc-attr.h" | ||
#include "parse.h" | ||
#include "read.h" | ||
#include "subparser.h" | ||
#include "trace.h" | ||
|
||
|
||
/* | ||
* DATA DECLARATIONS | ||
*/ | ||
enum yamlfrontmatterDetectingState { | ||
DSTAT_LAST_KEY, | ||
DSTAT_LAST_VALUE, | ||
DSTAT_INITIAL, | ||
}; | ||
|
||
struct sYamlFrontMatterSubparser { | ||
yamlSubparser yaml; | ||
enum yamlfrontmatterDetectingState detection_state; | ||
}; | ||
|
||
|
||
/* | ||
* FUNCTION PROTOTYPES | ||
*/ | ||
static bool yamlFrontmattterInitTagEntry (tagEntryInfo *e, char *name, void *data); | ||
|
||
|
||
/* | ||
* DATA DEFINITIONS | ||
*/ | ||
|
||
static langType frontMatterLang; | ||
|
||
static tagYpathTable ypathTables [] = { | ||
{ | ||
"title", | ||
DSTAT_LAST_VALUE, | ||
.initTagEntry = yamlFrontmattterInitTagEntry, | ||
}, | ||
}; | ||
|
||
|
||
/* | ||
* FUNCTION DEFINITIONS | ||
*/ | ||
|
||
static void yamlfrontmatterStateMachine (struct sYamlFrontMatterSubparser *yamlfrontmatter, | ||
yaml_token_t *token) | ||
{ | ||
#ifdef DO_TRACING | ||
ypathPrintTypeStack (YAML(yamlfrontmatter)); | ||
#endif | ||
|
||
switch (token->type) | ||
{ | ||
case YAML_KEY_TOKEN: | ||
yamlfrontmatter->detection_state = DSTAT_LAST_KEY; | ||
break; | ||
case YAML_SCALAR_TOKEN: | ||
switch (yamlfrontmatter->detection_state) | ||
{ | ||
case DSTAT_LAST_KEY: | ||
ypathFillKeywordOfTokenMaybe (YAML(yamlfrontmatter), token, getInputLanguage ()); | ||
/* FALL THROUGH */ | ||
case DSTAT_LAST_VALUE: | ||
TRACE_PRINT("token-callback: %s: %s", | ||
(yamlfrontmatter->detection_state == DSTAT_LAST_KEY)? "key": "value", | ||
(char*)token->data.scalar.value); | ||
ypathHandleToken (YAML(yamlfrontmatter), token, yamlfrontmatter->detection_state, | ||
ypathTables, ARRAY_SIZE (ypathTables)); | ||
break; | ||
default: | ||
break; | ||
} | ||
|
||
yamlfrontmatter->detection_state = DSTAT_INITIAL; | ||
|
||
break; | ||
case YAML_VALUE_TOKEN: | ||
yamlfrontmatter->detection_state = DSTAT_LAST_VALUE; | ||
break; | ||
|
||
default: | ||
yamlfrontmatter->detection_state = DSTAT_INITIAL; | ||
break; | ||
} | ||
} | ||
|
||
static void newTokenCallback (yamlSubparser *s, yaml_token_t *token) | ||
{ | ||
if (token->type == YAML_BLOCK_SEQUENCE_START_TOKEN | ||
|| token->type == YAML_BLOCK_MAPPING_START_TOKEN) | ||
ypathPushType (s, token); | ||
|
||
yamlfrontmatterStateMachine ((struct sYamlFrontMatterSubparser *)s, token); | ||
|
||
if (token->type == YAML_BLOCK_END_TOKEN) | ||
ypathPopType (s); | ||
else if (token->type == YAML_STREAM_END_TOKEN) | ||
ypathPopAllTypes (s); | ||
} | ||
|
||
static bool yamlFrontmattterInitTagEntry (tagEntryInfo *e, char *name, void * data CTAGS_ATTR_UNUSED) | ||
{ | ||
initForeignTagEntry (e, name, frontMatterLang, FRONTMATTER_TITLE_KIND); | ||
return true; | ||
} | ||
|
||
static void yamlFrontMatterInputStart(subparser *s) | ||
{ | ||
((struct sYamlFrontMatterSubparser*)s)->detection_state = DSTAT_INITIAL; | ||
((yamlSubparser*)s)->ypathTypeStack = NULL; | ||
} | ||
|
||
static void yamlFrontMatterInputEnd(subparser *s) | ||
{ | ||
Assert (((yamlSubparser*)s)->ypathTypeStack == NULL); | ||
} | ||
|
||
static void findYamlFrontMatterTags (void) | ||
{ | ||
scheduleRunningBaseparser (0); | ||
} | ||
|
||
static void yamlFrontMatterInitialize (langType language) | ||
{ | ||
ypathCompileTables (language, ypathTables, ARRAY_SIZE (ypathTables), 0); | ||
frontMatterLang = getNamedLanguage ("FrontMatter", 0); | ||
} | ||
|
||
static void yamlFrontMatterFinalize (langType language, bool initialized) | ||
{ | ||
if (initialized) | ||
ypathCompiledCodeDelete (ypathTables, ARRAY_SIZE (ypathTables)); | ||
} | ||
|
||
extern parserDefinition* YamlFrontMatter (void) | ||
{ | ||
static struct sYamlFrontMatterSubparser yamlfrontmatterSubparser = { | ||
.yaml = { | ||
.subparser = { | ||
.direction = SUBPARSER_SUB_RUNS_BASE, | ||
.inputStart = yamlFrontMatterInputStart, | ||
.inputEnd = yamlFrontMatterInputEnd, | ||
}, | ||
.newTokenNotfify = newTokenCallback | ||
}, | ||
}; | ||
static parserDependency dependencies [] = { | ||
{ DEPTYPE_SUBPARSER, "Yaml", &yamlfrontmatterSubparser }, | ||
{ DEPTYPE_FOREIGNER, "FrontMatter", NULL }, | ||
}; | ||
|
||
parserDefinition* const def = parserNew ("YamlFrontMatter"); | ||
|
||
def->dependencies = dependencies; | ||
def->dependencyCount = ARRAY_SIZE (dependencies); | ||
|
||
def->kindTable = NULL; | ||
def->kindCount = 0; | ||
def->parser = findYamlFrontMatterTags; | ||
def->initialize = yamlFrontMatterInitialize; | ||
def->finalize = yamlFrontMatterFinalize; | ||
|
||
/* This parser runs ONLY as a part of FrontMatter parser. | ||
* User may not want to enable/disable this parser directly. */ | ||
def->invisible = true; | ||
|
||
return def; | ||
} |
Oops, something went wrong.