180 lines
5.8 KiB
Java
180 lines
5.8 KiB
Java
|
|
|
|
import edu.princeton.cs.introcs.In;
|
|
import edu.princeton.cs.introcs.StdIn;
|
|
import edu.princeton.cs.introcs.StdOut;
|
|
|
|
/*************************************************************************
|
|
* Compilation: javac SymbolGraph.java
|
|
* Execution: java SymbolGraph filename.txt delimiter
|
|
* Dependencies: ST.java Graph.java In.java StdIn.java StdOut.java
|
|
* Data files: http://algs4.cs.princeton.edu/41undirected/routes.txt
|
|
* http://algs4.cs.princeton.edu/41undirected/movies.txt
|
|
* http://algs4.cs.princeton.edu/41undirected/moviestiny.txt
|
|
* http://algs4.cs.princeton.edu/41undirected/moviesG.txt
|
|
* http://algs4.cs.princeton.edu/41undirected/moviestopGrossing.txt
|
|
*
|
|
* % java SymbolGraph routes.txt " "
|
|
* JFK
|
|
* MCO
|
|
* ATL
|
|
* ORD
|
|
* LAX
|
|
* PHX
|
|
* LAS
|
|
*
|
|
* % java SymbolGraph movies.txt "/"
|
|
* Tin Men (1987)
|
|
* Hershey, Barbara
|
|
* Geppi, Cindy
|
|
* Jones, Kathy (II)
|
|
* Herr, Marcia
|
|
* ...
|
|
* Blumenfeld, Alan
|
|
* DeBoy, David
|
|
* Bacon, Kevin
|
|
* Woodsman, The (2004)
|
|
* Wild Things (1998)
|
|
* Where the Truth Lies (2005)
|
|
* Tremors (1990)
|
|
* ...
|
|
* Apollo 13 (1995)
|
|
* Animal House (1978)
|
|
*
|
|
*
|
|
* Assumes that input file is encoded using UTF-8.
|
|
* % iconv -f ISO-8859-1 -t UTF-8 movies-iso8859.txt > movies.txt
|
|
*
|
|
*************************************************************************/
|
|
|
|
/**
|
|
* The SymbolGraph class represents an undirected graph, where the
|
|
* vertex names are arbitrary strings.
|
|
* By providing mappings between string vertex names and integers,
|
|
* it serves as a wrapper around the
|
|
* {@link Graph} data type, which assumes the vertex names are integers
|
|
* between 0 and V - 1.
|
|
* It also supports initializing a symbol graph from a file.
|
|
*
|
|
* This implementation uses an {@link ST} to map from strings to integers,
|
|
* an array to map from integers to strings, and a {@link Graph} to store
|
|
* the underlying graph.
|
|
* The index and contains operations take time
|
|
* proportional to log V , where V is the number of vertices.
|
|
* The name operation takes constant time.
|
|
*
|
|
* For additional documentation, see <a href="http://algs4.cs.princeton.edu/41undirected">Section 4.1</a> of
|
|
* Algorithms, 4th Edition by Robert Sedgewick and Kevin Wayne.
|
|
*
|
|
* @author Robert Sedgewick
|
|
* @author Kevin Wayne
|
|
*/
|
|
public class SymbolGraph {
|
|
private ST<String, Integer> st; // string -> index
|
|
private String[] keys; // index -> string
|
|
private Graph G;
|
|
|
|
/**
|
|
* Initializes a graph from a file using the specified delimiter.
|
|
* Each line in the file contains
|
|
* the name of a vertex, followed by a list of the names
|
|
* of the vertices adjacent to that vertex, separated by the delimiter.
|
|
* @param filename the name of the file
|
|
* @param delimiter the delimiter between fields
|
|
*/
|
|
public SymbolGraph(String filename, String delimiter) {
|
|
st = new ST<String, Integer>();
|
|
|
|
// First pass builds the index by reading strings to associate
|
|
// distinct strings with an index
|
|
In in = new In(filename);
|
|
// while (in.hasNextLine()) {
|
|
while (!in.isEmpty()) {
|
|
String[] a = in.readLine().split(delimiter);
|
|
for (int i = 0; i < a.length; i++) {
|
|
if (!st.contains(a[i]))
|
|
st.put(a[i], st.size());
|
|
}
|
|
}
|
|
StdOut.println("Done reading " + filename);
|
|
|
|
// inverted index to get string keys in an aray
|
|
keys = new String[st.size()];
|
|
for (String name : st.keys()) {
|
|
keys[st.get(name)] = name;
|
|
}
|
|
|
|
// second pass builds the graph by connecting first vertex on each
|
|
// line to all others
|
|
G = new Graph(st.size());
|
|
in = new In(filename);
|
|
while (in.hasNextLine()) {
|
|
String[] a = in.readLine().split(delimiter);
|
|
int v = st.get(a[0]);
|
|
for (int i = 1; i < a.length; i++) {
|
|
int w = st.get(a[i]);
|
|
G.addEdge(v, w);
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Does the graph contain the vertex named s ?
|
|
* @param s the name of a vertex
|
|
* @return true if s is the name of a vertex, and false otherwise
|
|
*/
|
|
public boolean contains(String s) {
|
|
return st.contains(s);
|
|
}
|
|
|
|
/**
|
|
* Returns the integer associated with the vertex named s .
|
|
* @param s the name of a vertex
|
|
* @return the integer (between 0 and V - 1) associated with the vertex named s
|
|
*/
|
|
public int index(String s) {
|
|
return st.get(s);
|
|
}
|
|
|
|
/**
|
|
* Returns the name of the vertex associated with the integer v .
|
|
* @param v the integer corresponding to a vertex (between 0 and V - 1)
|
|
* @return the name of the vertex associated with the integer v
|
|
*/
|
|
public String name(int v) {
|
|
return keys[v];
|
|
}
|
|
|
|
/**
|
|
* Returns the graph assoicated with the symbol graph. It is the client's responsibility
|
|
* not to mutate the graph.
|
|
* @return the graph associated with the symbol graph
|
|
*/
|
|
public Graph G() {
|
|
return G;
|
|
}
|
|
|
|
|
|
/**
|
|
* Unit tests the SymbolGraph data type.
|
|
*/
|
|
public static void main(String[] args) {
|
|
String filename = args[0];
|
|
String delimiter = args[1];
|
|
SymbolGraph sg = new SymbolGraph(filename, delimiter);
|
|
Graph G = sg.G();
|
|
while (StdIn.hasNextLine()) {
|
|
String source = StdIn.readLine();
|
|
if (sg.contains(source)) {
|
|
int s = sg.index(source);
|
|
for (int v : G.adj(s)) {
|
|
StdOut.println(" " + sg.name(v));
|
|
}
|
|
}
|
|
else {
|
|
StdOut.println("input not contain '" + source + "'");
|
|
}
|
|
}
|
|
}
|
|
}
|