| /* |
| * Copyright 2000-2012 JetBrains s.r.o. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package com.intellij.spellchecker.generator; |
| |
| import com.intellij.lang.Language; |
| import com.intellij.lang.LanguageNamesValidation; |
| import com.intellij.lang.refactoring.NamesValidator; |
| import com.intellij.openapi.diagnostic.Logger; |
| import com.intellij.openapi.progress.ProgressIndicator; |
| import com.intellij.openapi.progress.ProgressManager; |
| import com.intellij.openapi.project.Project; |
| import com.intellij.openapi.util.TextRange; |
| import com.intellij.openapi.util.io.FileUtil; |
| import com.intellij.openapi.vfs.VfsUtilCore; |
| import com.intellij.openapi.vfs.VirtualFile; |
| import com.intellij.openapi.vfs.VirtualFileVisitor; |
| import com.intellij.psi.PsiElement; |
| import com.intellij.psi.PsiFile; |
| import com.intellij.psi.PsiManager; |
| import com.intellij.psi.util.PsiTreeUtil; |
| import com.intellij.spellchecker.SpellCheckerManager; |
| import com.intellij.spellchecker.inspections.SpellCheckingInspection; |
| import com.intellij.spellchecker.inspections.Splitter; |
| import com.intellij.spellchecker.tokenizer.TokenConsumer; |
| import com.intellij.util.Consumer; |
| import com.intellij.util.containers.MultiMap; |
| import org.jetbrains.annotations.NotNull; |
| |
| import java.io.File; |
| import java.io.FileWriter; |
| import java.io.IOException; |
| import java.util.*; |
| |
| public abstract class SpellCheckerDictionaryGenerator { |
| private static final Logger LOG = Logger.getInstance("#com.intellij.spellchecker.generator.SpellCheckerDictionaryGenerator"); |
| private final Set<String> globalSeenNames = new HashSet<String>(); |
| protected final Project myProject; |
| private final String myDefaultDictName; |
| protected final String myDictOutputFolder; |
| protected final MultiMap<String, VirtualFile> myDict2FolderMap; |
| protected final Set<VirtualFile> myExcludedFolders = new HashSet<VirtualFile>(); |
| protected SpellCheckerManager mySpellCheckerManager; |
| |
| public SpellCheckerDictionaryGenerator(final Project project, final String dictOutputFolder, final String defaultDictName) { |
| myDict2FolderMap = new MultiMap<String, VirtualFile>(); |
| myProject = project; |
| myDefaultDictName = defaultDictName; |
| mySpellCheckerManager = SpellCheckerManager.getInstance(myProject); |
| myDictOutputFolder = dictOutputFolder; |
| } |
| |
| public void addFolder(String dictName, VirtualFile path) { |
| myDict2FolderMap.putValue(dictName, path); |
| } |
| |
| public void excludeFolder(VirtualFile folder) { |
| myExcludedFolders.add(folder); |
| } |
| |
| public void generate() { |
| ProgressManager.getInstance().runProcessWithProgressSynchronously(new Runnable() { |
| @Override |
| public void run() { |
| ProgressIndicator progressIndicator = ProgressManager.getInstance().getProgressIndicator(); |
| // let's do result a bit more predictable |
| |
| // ruby dictionary |
| generate(myDefaultDictName, progressIndicator); |
| |
| // other gem-related dictionaries in alphabet order |
| final List<String> dictionaries = new ArrayList<String>(myDict2FolderMap.keySet()); |
| Collections.sort(dictionaries); |
| |
| for (String dict : dictionaries) { |
| if (myDefaultDictName.equals(dict)) { |
| continue; |
| } |
| generate(dict, progressIndicator); |
| } |
| } |
| }, "Generating Dictionaries", false, myProject); |
| } |
| |
| private void generate(@NotNull String dict, ProgressIndicator progressIndicator) { |
| progressIndicator.setText("Processing dictionary: " + dict); |
| generateDictionary(myProject, myDict2FolderMap.get(dict), myDictOutputFolder + "/" + dict + ".dic", progressIndicator); |
| } |
| |
| private void generateDictionary(final Project project, final Collection<VirtualFile> folderPaths, final String outFile, |
| final ProgressIndicator progressIndicator) { |
| final HashSet<String> seenNames = new HashSet<String>(); |
| // Collect stuff |
| for (VirtualFile folder : folderPaths) { |
| progressIndicator.setText2("Scanning folder: " + folder.getPath()); |
| final PsiManager manager = PsiManager.getInstance(project); |
| processFolder(seenNames, manager, folder); |
| } |
| |
| if (seenNames.isEmpty()) { |
| LOG.info(" No new words was found."); |
| return; |
| } |
| |
| final StringBuilder builder = new StringBuilder(); |
| // Sort names |
| final ArrayList<String> names = new ArrayList<String>(seenNames); |
| Collections.sort(names); |
| for (String name : names) { |
| if (builder.length() > 0){ |
| builder.append("\n"); |
| } |
| builder.append(name); |
| } |
| try { |
| final File dictionaryFile = new File(outFile); |
| FileUtil.createIfDoesntExist(dictionaryFile); |
| final FileWriter writer = new FileWriter(dictionaryFile.getPath()); |
| try { |
| writer.write(builder.toString()); |
| } |
| finally { |
| writer.close(); |
| } |
| } |
| catch (IOException e) { |
| LOG.error(e); |
| } |
| } |
| |
| protected void processFolder(final HashSet<String> seenNames, final PsiManager manager, final VirtualFile folder) { |
| VfsUtilCore.visitChildrenRecursively(folder, new VirtualFileVisitor() { |
| @Override |
| public boolean visitFile(@NotNull VirtualFile file) { |
| if (myExcludedFolders.contains(file)) { |
| return false; |
| } |
| if (!file.isDirectory()) { |
| final PsiFile psiFile = manager.findFile(file); |
| if (psiFile != null) { |
| processFile(psiFile, seenNames); |
| } |
| } |
| return true; |
| } |
| }); |
| } |
| |
| protected abstract void processFile(PsiFile file, HashSet<String> seenNames); |
| |
| protected void process(final PsiElement element, @NotNull final HashSet<String> seenNames) { |
| final int endOffset = element.getTextRange().getEndOffset(); |
| |
| // collect leafs (spell checker inspection works with leafs) |
| final List<PsiElement> leafs = new ArrayList<PsiElement>(); |
| if (element.getChildren().length == 0) { |
| // if no children - it is a leaf! |
| leafs.add(element); |
| } else { |
| // else collect leafs under given element |
| PsiElement currentLeaf = PsiTreeUtil.firstChild(element); |
| while (currentLeaf != null && currentLeaf.getTextRange().getEndOffset() <= endOffset) { |
| leafs.add(currentLeaf); |
| currentLeaf = PsiTreeUtil.nextLeaf(currentLeaf); |
| } |
| } |
| |
| for (PsiElement leaf : leafs) { |
| processLeafsNames(leaf, seenNames); |
| } |
| } |
| |
| protected void processLeafsNames(@NotNull final PsiElement leafElement, @NotNull final HashSet<String> seenNames) { |
| final Language language = leafElement.getLanguage(); |
| SpellCheckingInspection.tokenize(leafElement, language, new TokenConsumer() { |
| @Override |
| public void consumeToken(PsiElement element, final String text, boolean useRename, int offset, TextRange rangeToCheck, Splitter splitter) { |
| splitter.split(text, rangeToCheck, new Consumer<TextRange>() { |
| @Override |
| public void consume(TextRange textRange) { |
| final String word = textRange.substring(text); |
| addSeenWord(seenNames, word, language); |
| } |
| }); |
| } |
| }); |
| } |
| |
| protected void addSeenWord(HashSet<String> seenNames, String word, Language language) { |
| final String lowerWord = word.toLowerCase(); |
| if (globalSeenNames.contains(lowerWord)) { |
| return; |
| } |
| |
| final NamesValidator namesValidator = LanguageNamesValidation.INSTANCE.forLanguage(language); |
| if (namesValidator != null && namesValidator.isKeyword(word, myProject)) { |
| return; |
| } |
| |
| globalSeenNames.add(lowerWord); |
| if (mySpellCheckerManager.hasProblem(lowerWord)){ |
| seenNames.add(lowerWord); |
| } |
| } |
| } |