xref: /netbsd-src/external/gpl3/gcc.old/dist/gcc/spellcheck-tree.c (revision e6c7e151de239c49d2e38720a061ed9d1fa99309)
1 /* Find near-matches for identifiers.
2    Copyright (C) 2015-2017 Free Software Foundation, Inc.
3 
4 This file is part of GCC.
5 
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
10 
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
14 for more details.
15 
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3.  If not see
18 <http://www.gnu.org/licenses/>.  */
19 
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "tree.h"
25 #include "cpplib.h"
26 #include "spellcheck-tree.h"
27 #include "selftest.h"
28 #include "stringpool.h"
29 
30 /* Calculate Levenshtein distance between two identifiers.  */
31 
32 edit_distance_t
33 levenshtein_distance (tree ident_s, tree ident_t)
34 {
35   gcc_assert (TREE_CODE (ident_s) == IDENTIFIER_NODE);
36   gcc_assert (TREE_CODE (ident_t) == IDENTIFIER_NODE);
37 
38   return levenshtein_distance (IDENTIFIER_POINTER (ident_s),
39 			       IDENTIFIER_LENGTH (ident_s),
40 			       IDENTIFIER_POINTER (ident_t),
41 			       IDENTIFIER_LENGTH (ident_t));
42 }
43 
44 /* Given TARGET, an identifier, and CANDIDATES, a vec of identifiers,
45    determine which element within CANDIDATES has the lowest edit
46    distance to TARGET.  If there are multiple elements with the
47    same minimal distance, the first in the vector wins.
48 
49    If more than half of the letters were misspelled, the suggestion is
50    likely to be meaningless, so return NULL_TREE for this case.  */
51 
52 tree
53 find_closest_identifier (tree target, const auto_vec<tree> *candidates)
54 {
55   gcc_assert (TREE_CODE (target) == IDENTIFIER_NODE);
56 
57   best_match<tree, tree> bm (target);
58   int i;
59   tree identifier;
60   FOR_EACH_VEC_ELT (*candidates, i, identifier)
61     {
62       gcc_assert (TREE_CODE (identifier) == IDENTIFIER_NODE);
63       bm.consider (identifier);
64     }
65 
66   return bm.get_best_meaningful_candidate ();
67 }
68 
69 /* A callback for cpp_forall_identifiers, for use by best_macro_match's ctor.
70    Process HASHNODE and update the best_macro_match instance pointed to be
71    USER_DATA.  */
72 
73 static int
74 find_closest_macro_cpp_cb (cpp_reader *, cpp_hashnode *hashnode,
75 			   void *user_data)
76 {
77   if (hashnode->type != NT_MACRO)
78     return 1;
79 
80   best_macro_match *bmm = (best_macro_match *)user_data;
81   bmm->consider (hashnode);
82 
83   /* Keep iterating.  */
84   return 1;
85 }
86 
87 /* Constructor for best_macro_match.
88    Use find_closest_macro_cpp_cb to find the closest matching macro to
89    NAME within distance < best_distance_so_far. */
90 
91 best_macro_match::best_macro_match (tree goal,
92 				    edit_distance_t best_distance_so_far,
93 				    cpp_reader *reader)
94 : best_match <goal_t, candidate_t> (goal, best_distance_so_far)
95 {
96   cpp_forall_identifiers (reader, find_closest_macro_cpp_cb, this);
97 }
98 
99 #if CHECKING_P
100 
101 namespace selftest {
102 
103 /* Selftests.  */
104 
105 /* Verify that find_closest_identifier is sane.  */
106 
107 static void
108 test_find_closest_identifier ()
109 {
110   auto_vec<tree> candidates;
111 
112   /* Verify that it can handle an empty vec.  */
113   ASSERT_EQ (NULL, find_closest_identifier (get_identifier (""), &candidates));
114 
115   /* Verify that it works sanely for non-empty vecs.  */
116   tree apple = get_identifier ("apple");
117   tree banana = get_identifier ("banana");
118   tree cherry = get_identifier ("cherry");
119   candidates.safe_push (apple);
120   candidates.safe_push (banana);
121   candidates.safe_push (cherry);
122 
123   ASSERT_EQ (apple, find_closest_identifier (get_identifier ("app"),
124 					     &candidates));
125   ASSERT_EQ (banana, find_closest_identifier (get_identifier ("banyan"),
126 					      &candidates));;
127   ASSERT_EQ (cherry, find_closest_identifier (get_identifier ("berry"),
128 					      &candidates));
129   ASSERT_EQ (NULL,
130 	     find_closest_identifier (get_identifier ("not like the others"),
131 				      &candidates));
132 }
133 
134 /* Run all of the selftests within this file.  */
135 
136 void
137 spellcheck_tree_c_tests ()
138 {
139   test_find_closest_identifier ();
140 }
141 
142 } // namespace selftest
143 
144 #endif /* #if CHECKING_P */
145