001    /*
002     * Sonar, open source software quality management tool.
003     * Copyright (C) 2008-2012 SonarSource
004     * mailto:contact AT sonarsource DOT com
005     *
006     * Sonar is free software; you can redistribute it and/or
007     * modify it under the terms of the GNU Lesser General Public
008     * License as published by the Free Software Foundation; either
009     * version 3 of the License, or (at your option) any later version.
010     *
011     * Sonar is distributed in the hope that it will be useful,
012     * but WITHOUT ANY WARRANTY; without even the implied warranty of
013     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
014     * Lesser General Public License for more details.
015     *
016     * You should have received a copy of the GNU Lesser General Public
017     * License along with Sonar; if not, write to the Free Software
018     * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02
019     */
020    
021    package org.sonar.squid.recognizer;
022    
023    import java.util.ArrayList;
024    import java.util.List;
025    
026    public class CodeRecognizer {
027    
028      private LanguageFootprint language;
029      private double            threshold;
030    
031      public CodeRecognizer(double threshold, LanguageFootprint language) {
032        this.language = language;
033        this.threshold = threshold;
034      }
035    
036      public final double recognition(String line) {
037        double probability = 0;
038        for (Detector pattern : language.getDetectors()) {
039          probability = 1 - ((1 - probability) * (1 - pattern.recognition(line)));
040        }
041        return probability;
042      }
043    
044      public final List<String> extractCodeLines(List<String> lines) {
045        ArrayList<String> codeLines = new ArrayList<String>();
046        for (String line : lines) {
047          if (recognition(line) >= threshold) {
048            codeLines.add(line);
049          }
050        }
051        return codeLines;
052      }
053    
054      public final boolean isLineOfCode(String line) {
055        return recognition(line) - threshold > 0;
056      }
057    }