package pfff

You can search for identifiers within the package.

in-package search v0.2.0

pfff
- Library commons
  - Common
    
    SMap
  - Common2
    
    olist
    
    BasicType
    
    Infix
    
    shared_variable_hook
    
    ArithFloatInfix
    
    StringSet
    
    IntMap
    
    IntIntMap
  - Dumper
  - File_type
  - Map_
  - OUnit
  - Ocaml
  - Set_
- Library commons_core
  - ANSITerminal
  - Console
  - Int
  - Logger
  - Math
  - Parallel
- Library pfff-commons-graph
  - Graphe
- Library pfff-config
  - Config_pfff
- Library pfff-graph_code
- Library pfff-h_files-format
- Library pfff-h_program-lang
- Library pfff-h_version-control
- Library pfff-h_visualization
  - Figures
  - Gnuplot
  - Html
  - Latex
  - Plot_jgraph
  - Simple_color
  - Treemap
- Library pfff-lang_FUZZY
- Library pfff-lang_GENERIC
  - Ast
  - Lang
  - Lib_ast
  - Map_ast
  - Meta_ast
  - Parse_generic
  - Test_parsing_generic
  - Visitor_ast
- Library pfff-lang_GENERIC-analyze
  - Controlflow
  - Controlflow_build
- Library pfff-lang_c
  - Ast_c
  - Ast_c_build
  - Lib_parsing_c
  - Meta_ast_c
  - Parse_c
  - Test_parsing_c
  - Unit_parsing_c
  - Visitor_c
    
    Ast_cpp
- Library pfff-lang_c-analyze
- Library pfff-lang_cpp
- Library pfff-lang_cpp-analyze
- Library pfff-lang_java
- Library pfff-lang_java-analyze
- Library pfff-lang_js
  - Cst_js
    
    PI
  - Flag_parsing_js
  - Lexer_js
    
    Flag
    
    PI
  - Lib_parsing_js
  - Meta_cst_js
  - Parse_js
  - Parser_js
  - Parsing_hacks_js
  - Test_parsing_js
  - Token_helpers_js
  - Unit_parsing_js
  - Visitor_js
- Library pfff-lang_js-analyze
- Library pfff-lang_ml
  - Cst_ml
  - Lexer_ml
    
    Ast
    
    Flag
  - Lib_parsing_ml
  - Meta_cst_ml
  - Parse_ml
  - Parser_ml
  - Test_parsing_ml
  - Token_helpers_ml
  - Unit_parsing_ml
  - Visitor_ml
- Library pfff-lang_ml-analyze
  - Ast_ml
  - Ast_ml_build
    
    A
  - Coverage_ml
  - Database_light_ml
  - Graph_code_ml
  - Highlight_ml
  - Ml_to_generic
    
    G
  - Module_ml
  - Tags_ml
  - Test_analyze_ml
  - Unit_analyze_ml
- Library pfff-lang_nw
- Library pfff-lang_nw-analyze
  - Highlight_nw
  - Test_analyze_nw
- Library pfff-lang_python
- Library pfff-lang_python-analyze
- Library pfff-linter
  - Check_all_generic
  - Check_cfg_generic
  - Entity_generic
  - Flag_linter
  - R2c
    
    J
    
    PI
    
    E
  - Unit_linter
- Library pfff-matcher
  - Flag_matcher
  - Fuzzy_vs_fuzzy
    
    PARAM
    
    X_VS_X
  - Generic_vs_generic
    
    A
    
    B
    
    MV
    
    Ast
    
    Lib
  - Matching_fuzzy
  - Matching_report
  - Metavars_fuzzy
  - Metavars_generic
  - Sgrep_fuzzy
  - Sgrep_generic
    
    Ast
    
    V
    
    GG
  - Spatch_fuzzy
  - Transforming_fuzzy
  - Unit_matcher
- Sources
  - commons
    
    common.ml
    
    common2.ml
    
    dumper.ml
    
    file_type.ml
    
    map_.ml
    
    oUnit.ml
    
    ocaml.ml
    
    set_.ml
  - commons_core
    
    ANSITerminal.ml
    
    console.ml
    
    int.ml
    
    logger.ml
    
    math.ml
    
    parallel.ml
  - pfff-commons-graph
    
    graphe.ml
  - pfff-config
    
    config_pfff.ml
  - pfff-graph_code
    
    dependencies_matrix_build.ml
    
    dependencies_matrix_code.ml
    
    graph_code.ml
    
    graph_code_checker.ml
    
    graph_code_class_analysis.ml
    
    graph_code_database.ml
    
    graph_code_export.ml
    
    graph_code_helpers.ml
    
    graph_code_opti.ml
    
    graph_code_prolog.ml
    
    graph_code_tags.ml
    
    layer_graph_code.ml
    
    test_graph_code.ml
    
    unit_graph_code.ml
  - pfff-h_files-format
    
    outline.ml
    
    simple_format.ml
    
    source_tree.ml
  - pfff-h_program-lang
    
    archi_code.ml
    
    archi_code_lexer.ml
    
    archi_code_parse.ml
    
    ast_fuzzy.ml
    
    ast_generic.ml
    
    big_grep.ml
    
    comment_code.ml
    
    coverage_code.ml
    
    database_code.ml
    
    datalog_code.ml
    
    entity_code.ml
    
    error_code.ml
    
    flag_parsing.ml
    
    highlight_code.ml
    
    info_code.ml
    
    layer_code.ml
    
    layer_coverage.ml
    
    layer_parse_errors.ml
    
    lib_ast_fuzzy.ml
    
    lib_unparser.ml
    
    meta_ast_fuzzy.ml
    
    meta_ast_generic_common.ml
    
    meta_parse_info.ml
    
    overlay_code.ml
    
    parse_info.ml
    
    pleac.ml
    
    pretty_print_code.ml
    
    prolog_code.ml
    
    refactoring_code.ml
    
    scope_code.ml
    
    skip_code.ml
    
    tags_file.ml
    
    test_program_lang.ml
    
    unit_program_lang.ml
  - pfff-h_version-control
    
    cvs.ml
    
    flag_version_control.ml
    
    generic_vcs.ml
    
    git.ml
    
    lib_vcs.ml
    
    mercurial.ml
    
    patch.ml
    
    subversion.ml
    
    test_version_control.ml
    
    unit_version_control.ml
    
    version_control.ml
  - pfff-h_visualization
    
    figures.ml
    
    gnuplot.ml
    
    html.ml
    
    latex.ml
    
    plot_jgraph.ml
    
    simple_color.ml
    
    treemap.ml
  - pfff-lang_FUZZY
    
    lang_fuzzy.ml
    
    parse_fuzzy.ml
    
    test_parsing_fuzzy.ml
  - pfff-lang_GENERIC
    
    ast.ml
    
    lang.ml
    
    lib_ast.ml
    
    map_ast.ml
    
    meta_ast.ml
    
    parse_generic.ml
    
    test_parsing_generic.ml
  - pfff-lang_GENERIC-analyze
    
    controlflow.ml
    
    controlflow_build.ml
  - pfff-lang_c
    
    ast_c.ml
    
    ast_c_build.ml
    
    lib_parsing_c.ml
    
    meta_ast_c.ml
    
    parse_c.ml
    
    test_parsing_c.ml
    
    unit_parsing_c.ml
    
    visitor_c.ml
  - pfff-lang_c-analyze
    
    ast_cil.ml
    
    c_to_generic.ml
    
    datalog_c.ml
    
    graph_code_c.ml
    
    meta_ast_cil.ml
    
    test_analyze_c.ml
  - pfff-lang_cpp
    
    cst_cpp.ml
    
    flag_parsing_cpp.ml
    
    lexer_cpp.ml
    
    lib_parsing_cpp.ml
    
    meta_cst_cpp.ml
    
    parse_cpp.ml
    
    parser_cpp.ml
    
    parser_cpp_mly_helper.ml
    
    parsing_hacks.ml
    
    parsing_hacks_cpp.ml
    
    parsing_hacks_define.ml
    
    parsing_hacks_lib.ml
    
    parsing_hacks_pp.ml
    
    parsing_hacks_typedef.ml
    
    parsing_recovery_cpp.ml
    
    pp_token.ml
    
    test_parsing_cpp.ml
    
    token_cpp.ml
    
    token_helpers_cpp.ml
    
    token_views_context.ml
    
    token_views_cpp.ml
    
    type_cpp.ml
    
    unit_parsing_cpp.ml
    
    visitor_cpp.ml
  - pfff-lang_cpp-analyze
    
    builtins_cpp.ml
    
    check_variables_cpp.ml
    
    database_light_cpp.ml
    
    flag_analyze_cpp.ml
    
    highlight_cpp.ml
    
    test_analyze_cpp.ml
  - pfff-lang_java
    
    ast_java.ml
    
    lexer_java.ml
    
    lib_parsing_java.ml
    
    meta_ast_java.ml
    
    parse_java.ml
    
    parser_java.ml
    
    parsing_hacks_java.ml
    
    test_parsing_java.ml
    
    token_helpers_java.ml
    
    unit_parsing_java.ml
    
    visitor_java.ml
  - pfff-lang_java-analyze
    
    builtins_java.ml
    
    graph_code_java.ml
    
    highlight_java.ml
    
    java_to_generic.ml
    
    package_java.ml
    
    test_analyze_java.ml
    
    unit_analyze_java.ml
  - pfff-lang_js
    
    cst_js.ml
    
    flag_parsing_js.ml
    
    lexer_js.ml
    
    lib_parsing_js.ml
    
    meta_cst_js.ml
    
    parse_js.ml
    
    parser_js.ml
    
    parsing_hacks_js.ml
    
    test_parsing_js.ml
    
    token_helpers_js.ml
    
    unit_parsing_js.ml
    
    visitor_js.ml
  - pfff-lang_js-analyze
    
    annotation_js.ml
    
    ast_js.ml
    
    ast_js_build.ml
    
    class_pre_es6.ml
    
    comment_js.ml
    
    database_light_js.ml
    
    graph_code_js.ml
    
    highlight_js.ml
    
    js_to_generic.ml
    
    lib_analyze_js.ml
    
    map_ast_js.ml
    
    meta_ast_js.ml
    
    module_path_js.ml
    
    module_pre_es6.ml
    
    stdlib_js.ml
    
    tags_js.ml
    
    test_analyze_js.ml
    
    transpile_js.ml
    
    unit_analyze_js.ml
    
    utils_js.ml
    
    visitor_ast_js.ml
  - pfff-lang_ml
    
    cst_ml.ml
    
    lexer_ml.ml
    
    lib_parsing_ml.ml
    
    meta_cst_ml.ml
    
    parse_ml.ml
    
    parser_ml.ml
    
    test_parsing_ml.ml
    
    token_helpers_ml.ml
    
    unit_parsing_ml.ml
    
    visitor_ml.ml
  - pfff-lang_ml-analyze
    
    ast_ml.ml
    
    ast_ml_build.ml
    
    coverage_ml.ml
    
    database_light_ml.ml
    
    graph_code_ml.ml
    
    highlight_ml.ml
    
    ml_to_generic.ml
    
    module_ml.ml
    
    tags_ml.ml
    
    test_analyze_ml.ml
    
    unit_analyze_ml.ml
  - pfff-lang_nw
    
    ast_nw.ml
    
    lexer_nw.ml
    
    parse_nw.ml
    
    test_parsing_nw.ml
    
    token_helpers_nw.ml
  - pfff-lang_nw-analyze
    
    highlight_nw.ml
    
    test_analyze_nw.ml
  - pfff-lang_python
    
    ast_python.ml
    
    lexer_python.ml
    
    lib_parsing_python.ml
    
    parse_python.ml
    
    parser_python.ml
    
    test_parsing_python.ml
    
    token_helpers_python.ml
  - pfff-lang_python-analyze
    
    database_light_python.ml
    
    highlight_python.ml
    
    python_to_generic.ml
    
    resolve_python.ml
    
    test_analyze_python.ml
  - pfff-linter
    
    check_all_generic.ml
    
    check_cfg_generic.ml
    
    entity_generic.ml
    
    flag_linter.ml
    
    r2c.ml
    
    unit_linter.ml
  - pfff-matcher
    
    flag_matcher.ml
    
    fuzzy_vs_fuzzy.ml
    
    generic_vs_generic.ml
    
    matching_fuzzy.ml
    
    matching_report.ml
    
    metavars_fuzzy.ml
    
    metavars_generic.ml
    
    sgrep_fuzzy.ml
    
    sgrep_generic.ml
    
    spatch_fuzzy.ml
    
    transforming_fuzzy.ml
    
    unit_matcher.ml

Legend:
Page
Library
Module
Module type
Parameter
Class
Class type
Source

Source file `ast_fuzzy.ml`

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
(* Yoann Padioleau
 *
 * Copyright (C) 2013 Facebook
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public License
 * version 2.1 as published by the Free Software Foundation, with the
 * special exception on linking described in file license.txt.
 *
 * This library is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the file
 * license.txt for more details.
 *)
open Common

(*****************************************************************************)
(* Prelude *)
(*****************************************************************************)
(* Sexp-like data structure to represent programs.
 *
 * When searching for or refactoring code, regexps are good enough most of 
 * the time; tools such as 'grep' or 'sed' are great. But certain regexps
 * are tedious to write when one needs to handle variations in spacing,
 * the possibility to have comments in the middle of the code you
 * are looking for, or newlines. Things are even more complicated when
 * you want to handle nested parenthesized expressions or statements. This is
 * because regexps can't count. For instance how would you
 * remove a namespace in C++? You would like to write a transformation
 * like:
 * 
 *  - namespace my_namespace {
 *    ...
 *  - }
 * 
 * but regexps can't do that[1].
 * 
 * The alternative is then to use more precise tools such as 'sgrep'
 * or 'spatch'. But implementing sgrep/spatch in the usual way 
 * for a new language, by matching AST against AST, can be really tedious. 
 * The AST can be big and even if we can auto generate most of the
 * boilerplate code, this still takes quite some effort (see lang_php/matcher).
 * 
 * Moreover, in my experience matching AST against AST lacks
 * flexibility sometimes. For instance many people want to use 'sgrep' to
 * find a method foo and so do "sgrep -e 'foo(...)'" but
 * because the matching is done at the AST level, 'foo(...)' is
 * parsed as a function call, not a method call, and so it will
 * not work. But people expect it to work because it works
 * with regexps. So 'sgrep' for PHP currently forces people to write this
 * pattern '$V->foo(...)'.
 * In the same way a pattern like '1' was originally matching
 * only expressions, but was not matching static constants because
 * again it was a different AST constructor. Actually many
 * of the extensions and bugfixes in sgrep_php/spatch_php in 
 * the last year have been related to this lack of flexibility
 * because the AST was too precise.
 * 
 * Enter Ast_fuzzy, a way to factorize most of the needs of
 * 'sgrep' and 'spatch' over different programming languages,
 * while being more flexible in some ways than having a precise AST.
 * It fills a niche between regexps and very-precise ASTs.
 * 
 * In Ast_fuzzy we just want to keep the parenthesized information
 * from the code, and abstract away spacing, the main things that 
 * regexps have trouble with, and then let people match over this
 * parenthesized cleaned-up tree in a flexible way.
 * 
 * related:
 *  - xpath? but do programming languages need the full power of xpath?
 *    usually an AST just has 3 different kinds of nodes, Defs, Stmts,
 *    and Exprs.
 * 
 * See also lang_cpp/parsing_cpp/test_parsing_cpp and its parse_cpp_fuzzy()
 * and dump_cpp_fuzzy() functions. Most of the code related to Ast_fuzzy
 * is in matcher/ and called from 'sgrep' and 'spatch'.
 * For 'sgrep' and 'spatch' examples, see unit_matcher.ml as well as
 * tests/cpp/sgrep/ and tests/cpp/spatch/
 * 
 * notes:
 *  [1] Actually Perl regexps are more powerful so one can do for instance:
 *  echo 'something< namespace<x<y<z,t>>>, other >' | 
 *    perl -pe 's/namespace(<(?:[^<>]|(?1))*>)/foo/'
 *  => 'something< foo, other >'
 *  but it's arguably more complicated than the proposed spatch above.
 * 
 * todo:
 *  - handle infix operators: parse them not as a sequence
 *    but as a tree as we want for instance '$X->foo()' to match
 *    whole expression like 'this->bar()->foo()', or we want
 *    '$X' to match '1+1' (and not only in Parens context)
 *    updated: or use ast_generic.ml for that?
 *  - same for function calls? so maybe we need to transform our
 *    original program in a lisp like AST where things are more uniform
 *    updated: or use ast_generic.ml for that?
 *  - how to handle isomorphisms like 'order of attributes doesn't matter'
 *    as in XHP? or class that can be mentioned anywhere in the arguments
 *    to implements? or how can we make 'class X { ... }' to also match
 *    'class X extends whatever { ... }'? or have public/static to
 *    be optional?
 *    Use regexp over trees? Use isomorphisms file as in coccinelle?
 *    Have special mark about optional things in ast_fuzzy? 
 *    Derive such information from the grammar?
 *  - want powerful queries like 
 *      'class X { ... function(...) { ... foo() ... } ... }'
 *    so sgrep is powerful for microlevel queries, and prolog for macrolevel
 *    queries. Xpath? Css selector?
 *)

(*****************************************************************************)
(* Types *)
(*****************************************************************************)

(* A token of the fuzzy tree is represented directly by a Parse_info.t
 * value; tok is only an abbreviation for that type.
 *)
type tok = Parse_info.t
(* A value of any type paired with a token; the token is the second
 * component of the pair.
 *)
type 'a wrap = 'a * tok

(* A node of the fuzzy tree. A node is either a delimited group (Parens,
 * Braces, Angle, Bracket), a Metavar, a Dots, or a plain Tok.
 * Each delimited group stores one tok before and one tok after its
 * content; presumably these are the opening and closing delimiter
 * tokens (TODO confirm against the code that builds these trees).
 *)
type tree =
  (* todo: comma *)
  (* Unlike the other groups, the content of Parens is a list whose
   * elements are, via Common.either, either a trees value or a single
   * tok (annotated below as a comma).
   *)
  | Parens of tok * (trees, tok (* comma*)) Common.either list * tok
  (* The three remaining groups hold their content as a plain trees. *)
  | Braces of tok * trees * tok
  | Angle  of tok * trees * tok
  | Bracket  of tok * trees * tok

  (* note that gcc allows $ in identifiers, so using $ for metavariables
   * means we will not be able to match such identifiers. No big deal.
   *)
  (* A metavariable: a string paired with a token. *)
  | Metavar of string wrap
  (* note that "..." are allowed in many languages, so using "..."
   * to represent a list of anything means we will not be able to
   * match specifically "...".
   *)
  (* Carries only a token, no string. *)
  | Dots of tok

  (* Any other token: a string paired with a token. *)
  | Tok of string wrap
(* trees is a list of tree nodes; tree and trees are mutually recursive. *)
and trees = tree list
 (* with tarzan *)

(* Predicate on strings: returns whatever the =~ operator yields when s
 * is tested against the regexp literal below, a pattern written to
 * recognize strings beginning with a dollar sign.
 * NOTE(review): =~ is not defined in this file; it presumably comes from
 * the opened Common module, so the exact matching semantics (anchoring,
 * newlines) should be confirmed there.
 *)
let is_metavar s =
  let dollar_prefixed = "^\\$.*" in
  s =~ dollar_prefixed

package pfff

Source file ast_fuzzy.ml

Source file `ast_fuzzy.ml`