|
1 |
| |
|
2 |
| |
|
3 |
| |
|
4 |
| package net.sourceforge.pmd.cpd; |
|
5 |
| |
|
6 |
| import java.io.File; |
|
7 |
| import java.io.FileNotFoundException; |
|
8 |
| import java.io.IOException; |
|
9 |
| import java.util.HashMap; |
|
10 |
| import java.util.HashSet; |
|
11 |
| import java.util.Iterator; |
|
12 |
| import java.util.List; |
|
13 |
| import java.util.Map; |
|
14 |
| import java.util.Set; |
|
15 |
| |
|
16 |
| public class CPD { |
|
17 |
| |
|
18 |
| private Map source = new HashMap(); |
|
19 |
| private CPDListener listener = new CPDNullListener(); |
|
20 |
| private Tokens tokens = new Tokens(); |
|
21 |
| private int minimumTileSize; |
|
22 |
| private MatchAlgorithm matchAlgorithm; |
|
23 |
| private Language language; |
|
24 |
| private boolean skipDuplicates; |
|
25 |
| |
|
26 |
0
| public CPD(int minimumTileSize, Language language) {
|
|
27 |
0
| this.minimumTileSize = minimumTileSize;
|
|
28 |
0
| this.language = language;
|
|
29 |
| } |
|
30 |
| |
|
31 |
0
| public void skipDuplicates() {
|
|
32 |
0
| this.skipDuplicates = true;
|
|
33 |
| } |
|
34 |
| |
|
35 |
0
| public void setCpdListener(CPDListener cpdListener) {
|
|
36 |
0
| this.listener = cpdListener;
|
|
37 |
| } |
|
38 |
| |
|
39 |
0
| public void go() {
|
|
40 |
0
| TokenEntry.clearImages();
|
|
41 |
0
| matchAlgorithm = new MatchAlgorithm(source, tokens, minimumTileSize, listener);
|
|
42 |
0
| matchAlgorithm.findMatches();
|
|
43 |
| } |
|
44 |
| |
|
45 |
0
| public Iterator getMatches() {
|
|
46 |
0
| return matchAlgorithm.matches();
|
|
47 |
| } |
|
48 |
| |
|
49 |
0
| public void add(File file) throws IOException {
|
|
50 |
0
| add(1, file);
|
|
51 |
| } |
|
52 |
| |
|
53 |
0
| public void addAllInDirectory(String dir) throws IOException {
|
|
54 |
0
| addDirectory(dir, false);
|
|
55 |
| } |
|
56 |
| |
|
57 |
0
| public void addRecursively(String dir) throws IOException {
|
|
58 |
0
| addDirectory(dir, true);
|
|
59 |
| } |
|
60 |
| |
|
61 |
0
| public void add(List files) throws IOException {
|
|
62 |
0
| for (Iterator i = files.iterator(); i.hasNext();) {
|
|
63 |
0
| add(files.size(), (File) i.next());
|
|
64 |
| } |
|
65 |
| } |
|
66 |
| |
|
67 |
0
| private void addDirectory(String dir, boolean recurse) throws IOException {
|
|
68 |
0
| if (!(new File(dir)).exists()) {
|
|
69 |
0
| throw new FileNotFoundException("Couldn't find directory " + dir);
|
|
70 |
| } |
|
71 |
0
| FileFinder finder = new FileFinder();
|
|
72 |
| |
|
73 |
0
| add(finder.findFilesFrom(dir, language.getFileFilter(), recurse));
|
|
74 |
| } |
|
75 |
| |
|
76 |
| private Set current = new HashSet(); |
|
77 |
| |
|
78 |
0
| private void add(int fileCount, File file) throws IOException {
|
|
79 |
| |
|
80 |
0
| if (skipDuplicates) {
|
|
81 |
| |
|
82 |
0
| String signature = file.getName() + '_' + file.length();
|
|
83 |
0
| if (current.contains(signature)) {
|
|
84 |
0
| System.out.println("Skipping " + file.getAbsolutePath() + " since it appears to be a duplicate file and --skip-duplicate-files is set");
|
|
85 |
0
| return;
|
|
86 |
| } |
|
87 |
0
| current.add(signature);
|
|
88 |
| } |
|
89 |
| |
|
90 |
0
| if (!file.getCanonicalPath().equals(file.getAbsolutePath())) {
|
|
91 |
0
| System.out.println("Skipping " + file + " since it appears to be a symlink");
|
|
92 |
0
| return;
|
|
93 |
| } |
|
94 |
| |
|
95 |
0
| listener.addedFile(fileCount, file);
|
|
96 |
0
| SourceCode sourceCode = new SourceCode(new SourceCode.FileCodeLoader(file));
|
|
97 |
0
| language.getTokenizer().tokenize(sourceCode, tokens);
|
|
98 |
0
| source.put(sourceCode.getFileName(), sourceCode);
|
|
99 |
| } |
|
100 |
| |
|
101 |
0
| public static Renderer getRendererFromString(String name) {
|
|
102 |
0
| if (name.equalsIgnoreCase("text") || name.equals("")) {
|
|
103 |
0
| return new SimpleRenderer();
|
|
104 |
| } |
|
105 |
0
| try {
|
|
106 |
0
| return (Renderer) Class.forName(name).newInstance();
|
|
107 |
| } catch (Exception e) { |
|
108 |
0
| System.out.println("Can't find class '" + name + "', defaulting to SimpleRenderer.");
|
|
109 |
| } |
|
110 |
0
| return new SimpleRenderer();
|
|
111 |
| } |
|
112 |
| |
|
113 |
0
| private static boolean findBooleanSwitch(String[] args, String name) {
|
|
114 |
0
| for (int i = 0; i < args.length; i++) {
|
|
115 |
0
| if (args[i].equals(name)) {
|
|
116 |
0
| return true;
|
|
117 |
| } |
|
118 |
| } |
|
119 |
0
| return false;
|
|
120 |
| } |
|
121 |
| |
|
122 |
0
| private static String findRequiredStringValue(String[] args, String name) {
|
|
123 |
0
| for (int i = 0; i < args.length; i++) {
|
|
124 |
0
| if (args[i].equals(name)) {
|
|
125 |
0
| return args[i + 1];
|
|
126 |
| } |
|
127 |
| } |
|
128 |
0
| System.out.println("No " + name + " value passed in");
|
|
129 |
0
| usage();
|
|
130 |
0
| throw new RuntimeException();
|
|
131 |
| } |
|
132 |
| |
|
133 |
0
| private static String findOptionalStringValue(String[] args, String name, String defaultValue) {
|
|
134 |
0
| for (int i = 0; i < args.length; i++) {
|
|
135 |
0
| if (args[i].equals(name)) {
|
|
136 |
0
| return args[i + 1];
|
|
137 |
| } |
|
138 |
| } |
|
139 |
0
| return defaultValue;
|
|
140 |
| } |
|
141 |
| |
|
142 |
0
| public static void main(String[] args) {
|
|
143 |
0
| if (args.length == 0) {
|
|
144 |
0
| usage();
|
|
145 |
| } |
|
146 |
| |
|
147 |
0
| try {
|
|
148 |
0
| boolean skipDuplicateFiles = findBooleanSwitch(args, "--skip-duplicate-files");
|
|
149 |
0
| String pathToFiles = findRequiredStringValue(args, "--files");
|
|
150 |
0
| String languageString = findOptionalStringValue(args, "--language", "java");
|
|
151 |
0
| String formatString = findOptionalStringValue(args, "--format", "text");
|
|
152 |
0
| int minimumTokens = Integer.parseInt(findRequiredStringValue(args, "--minimum-tokens"));
|
|
153 |
0
| LanguageFactory f = new LanguageFactory();
|
|
154 |
0
| Language language = f.createLanguage(languageString);
|
|
155 |
0
| Renderer renderer = CPD.getRendererFromString(formatString);
|
|
156 |
0
| CPD cpd = new CPD(minimumTokens, language);
|
|
157 |
0
| if (skipDuplicateFiles) {
|
|
158 |
0
| cpd.skipDuplicates();
|
|
159 |
| } |
|
160 |
0
| cpd.addRecursively(pathToFiles);
|
|
161 |
0
| cpd.go();
|
|
162 |
0
| System.out.println(renderer.render(cpd.getMatches()));
|
|
163 |
| } catch (Exception e) { |
|
164 |
0
| e.printStackTrace();
|
|
165 |
| } |
|
166 |
| } |
|
167 |
| |
|
168 |
0
| private static void usage() {
|
|
169 |
0
| System.out.println("Usage:");
|
|
170 |
0
| System.out.println(" java net.sourceforge.pmd.cpd.CPD --minimum-tokens xxx --files xxx [--language xxx] [--format (xml|text|csv)] [--skip-duplicate-files] ");
|
|
171 |
0
| System.out.println("i.e: ");
|
|
172 |
0
| System.out.println(" java net.sourceforge.pmd.cpd.CPD --minimum-tokens 100 --files c:\\jdk14\\src\\java ");
|
|
173 |
0
| System.out.println("or: ");
|
|
174 |
0
| System.out.println(" java net.sourceforge.pmd.cpd.CPD --minimum-tokens 100 --files /path/to/c/code --language c ");
|
|
175 |
0
| System.out.println("or: ");
|
|
176 |
0
| System.out.println(" java net.sourceforge.pmd.cpd.CPD --minimum-tokens 100 --files /path/to/java/code --format xml");
|
|
177 |
| } |
|
178 |
| |
|
179 |
| } |