mirror of
https://github.com/Rushilwiz/APCS.git
synced 2025-04-05 13:00:20 -04:00
147 lines
4.1 KiB
Java
147 lines
4.1 KiB
Java
// Name: B6-24
|
|
// Date: 12/11/19
|
|
// This program takes a text file, creates an index (by line numbers)
|
|
// for all the words in the file and writes the index
|
|
// into the output file. The program prompts the user for the file names.
|
|
|
|
import java.util.*;
|
|
import java.io.*;
|
|
|
|
public class IndexMaker
|
|
{
|
|
public static void main(String[] args) throws IOException
|
|
{
|
|
Scanner keyboard = new Scanner(System.in);
|
|
System.out.print("\nEnter input file name: ");
|
|
String inFileName = keyboard.nextLine().trim();
|
|
Scanner inputFile = new Scanner(new File(inFileName));
|
|
String outFileName = "fishIndex.txt";
|
|
PrintWriter outputFile = new PrintWriter(new FileWriter(outFileName));
|
|
indexDocument(inputFile, outputFile);
|
|
inputFile.close();
|
|
outputFile.close();
|
|
System.out.println("Done.");
|
|
}
|
|
public static void indexDocument(Scanner inputFile, PrintWriter outputFile)
|
|
{
|
|
DocumentIndex index = new DocumentIndex();
|
|
String line = null;
|
|
int lineNum = 0;
|
|
while(inputFile.hasNextLine())
|
|
{
|
|
lineNum++;
|
|
index.addAllWords(inputFile.nextLine(), lineNum);
|
|
}
|
|
for(IndexEntry entry : index)
|
|
outputFile.println(entry);
|
|
}
|
|
}
|
|
class DocumentIndex extends ArrayList<IndexEntry>
|
|
{
|
|
//constructors
|
|
public DocumentIndex() {
|
|
super();
|
|
}
|
|
|
|
public DocumentIndex(int a) {
|
|
super(a);
|
|
}
|
|
|
|
/** extracts all the words from str, skipping punctuation and whitespace
|
|
and for each word calls addWord(). In this situation, a good way to
|
|
extract while also skipping punctuation is to use String's split method,
|
|
e.g., str.split("[., \"!?]") */
|
|
public void addAllWords(String str, int lineNum)
|
|
{
|
|
String[] words = str.split("[., \"!?]");
|
|
for (int i = 0; i < words.length; i++)
|
|
if (!words[i].trim().equals(""))
|
|
addWord(words[i].trim(), lineNum);
|
|
}
|
|
|
|
/** calls foundOrInserted, which returns a position. At that position,
|
|
updates that IndexEntry's list of line numbers with lineNum. */
|
|
public void addWord(String word, int lineNum)
|
|
{
|
|
int index = foundOrInserted(word);
|
|
if (index != -1)
|
|
get(index).add(lineNum);
|
|
}
|
|
|
|
/** traverses this DocumentIndex and compares word to the words in the
|
|
IndexEntry objects in this list, looking for the correct position of
|
|
word. If an IndexEntry with word is not already in that position, the
|
|
method creates and inserts a new IndexEntry at that position. The
|
|
method returns the position of either the found or the inserted
|
|
IndexEntry.*/
|
|
private int foundOrInserted(String word)
|
|
{
|
|
word = word.toUpperCase();
|
|
|
|
if (size() == 0) {
|
|
add(new IndexEntry(word));
|
|
return 0;
|
|
}
|
|
|
|
for (int i = 0; i < size(); i++) {
|
|
IndexEntry ie = (IndexEntry)get(i);
|
|
if (ie.getWord().equals(word))
|
|
return i;
|
|
else if (ie.getWord().compareTo(word) > 0) {
|
|
add(i, new IndexEntry(word));
|
|
return i;
|
|
}
|
|
}
|
|
|
|
add(new IndexEntry(word));
|
|
return size()-1;
|
|
}
|
|
}
|
|
|
|
class IndexEntry implements Comparable<IndexEntry>
|
|
{
|
|
//fields
|
|
private String word;
|
|
private ArrayList<Integer> numsList;
|
|
|
|
//constructors
|
|
public IndexEntry (String a) {
|
|
word = a.toUpperCase();
|
|
numsList = new ArrayList<Integer>();
|
|
}
|
|
|
|
|
|
/** appends num to numsList, but only if it is not already in that list.
|
|
*/
|
|
public void add(int num)
|
|
{
|
|
if (!numsList.contains(num))
|
|
numsList.add(num);
|
|
}
|
|
|
|
/** this is a standard accessor method */
|
|
public String getWord()
|
|
{
|
|
return word;
|
|
}
|
|
|
|
/** returns a string representation of this Index Entry. */
|
|
public String toString()
|
|
{
|
|
String list = ""; Iterator it = numsList.iterator();
|
|
while(it.hasNext()) {
|
|
list += it.next();
|
|
if (it.hasNext())
|
|
list += ", ";
|
|
}
|
|
|
|
return word + " " + list;
|
|
}
|
|
|
|
public int compareTo(IndexEntry other) {
|
|
return word.compareTo(other.getWord());
|
|
}
|
|
|
|
}
|
|
|