001 /*
002 * Sonar, open source software quality management tool.
003 * Copyright (C) 2008-2012 SonarSource
004 * mailto:contact AT sonarsource DOT com
005 *
006 * Sonar is free software; you can redistribute it and/or
007 * modify it under the terms of the GNU Lesser General Public
008 * License as published by the Free Software Foundation; either
009 * version 3 of the License, or (at your option) any later version.
010 *
011 * Sonar is distributed in the hope that it will be useful,
012 * but WITHOUT ANY WARRANTY; without even the implied warranty of
013 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
014 * Lesser General Public License for more details.
015 *
016 * You should have received a copy of the GNU Lesser General Public
017 * License along with Sonar; if not, write to the Free Software
018 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
019 */
020
021 package org.sonar.squid.recognizer;
022
023 import java.util.ArrayList;
024 import java.util.List;
025
026 public class CodeRecognizer {
027
028 private LanguageFootprint language;
029 private double threshold;
030
031 public CodeRecognizer(double threshold, LanguageFootprint language) {
032 this.language = language;
033 this.threshold = threshold;
034 }
035
036 public final double recognition(String line) {
037 double probability = 0;
038 for (Detector pattern : language.getDetectors()) {
039 probability = 1 - ((1 - probability) * (1 - pattern.recognition(line)));
040 }
041 return probability;
042 }
043
044 public final List<String> extractCodeLines(List<String> lines) {
045 ArrayList<String> codeLines = new ArrayList<String>();
046 for (String line : lines) {
047 if (recognition(line) >= threshold) {
048 codeLines.add(line);
049 }
050 }
051 return codeLines;
052 }
053
054 public final boolean isLineOfCode(String line) {
055 return recognition(line) - threshold > 0;
056 }
057 }