programming-examples/java/Data_Structures/SymbolGraph.java

180 lines
5.8 KiB
Java
Raw Normal View History

2019-11-15 12:59:38 +01:00
import edu.princeton.cs.introcs.In;
import edu.princeton.cs.introcs.StdIn;
import edu.princeton.cs.introcs.StdOut;
/*************************************************************************
* Compilation: javac SymbolGraph.java
* Execution: java SymbolGraph filename.txt delimiter
* Dependencies: ST.java Graph.java In.java StdIn.java StdOut.java
* Data files: http://algs4.cs.princeton.edu/41undirected/routes.txt
* http://algs4.cs.princeton.edu/41undirected/movies.txt
* http://algs4.cs.princeton.edu/41undirected/moviestiny.txt
* http://algs4.cs.princeton.edu/41undirected/moviesG.txt
* http://algs4.cs.princeton.edu/41undirected/moviestopGrossing.txt
*
* % java SymbolGraph routes.txt " "
* JFK
* MCO
* ATL
* ORD
* LAX
* PHX
* LAS
*
* % java SymbolGraph movies.txt "/"
* Tin Men (1987)
* Hershey, Barbara
* Geppi, Cindy
* Jones, Kathy (II)
* Herr, Marcia
* ...
* Blumenfeld, Alan
* DeBoy, David
* Bacon, Kevin
* Woodsman, The (2004)
* Wild Things (1998)
* Where the Truth Lies (2005)
* Tremors (1990)
* ...
* Apollo 13 (1995)
* Animal House (1978)
*
*
* Assumes that input file is encoded using UTF-8.
* % iconv -f ISO-8859-1 -t UTF-8 movies-iso8859.txt > movies.txt
*
*************************************************************************/
/**
* The SymbolGraph class represents an undirected graph, where the
* vertex names are arbitrary strings.
* By providing mappings between string vertex names and integers,
* it serves as a wrapper around the
* {@link Graph} data type, which assumes the vertex names are integers
* between 0 and V - 1.
* It also supports initializing a symbol graph from a file.
*
* This implementation uses an {@link ST} to map from strings to integers,
* an array to map from integers to strings, and a {@link Graph} to store
* the underlying graph.
* The index and contains operations take time
* proportional to log V , where V is the number of vertices.
* The name operation takes constant time.
*
* For additional documentation, see <a href="http://algs4.cs.princeton.edu/41undirected">Section 4.1</a> of
* Algorithms, 4th Edition by Robert Sedgewick and Kevin Wayne.
*
* @author Robert Sedgewick
* @author Kevin Wayne
*/
public class SymbolGraph {
private ST<String, Integer> st; // string -> index
private String[] keys; // index -> string
private Graph G;
/**
* Initializes a graph from a file using the specified delimiter.
* Each line in the file contains
* the name of a vertex, followed by a list of the names
* of the vertices adjacent to that vertex, separated by the delimiter.
* @param filename the name of the file
* @param delimiter the delimiter between fields
*/
public SymbolGraph(String filename, String delimiter) {
st = new ST<String, Integer>();
// First pass builds the index by reading strings to associate
// distinct strings with an index
In in = new In(filename);
// while (in.hasNextLine()) {
while (!in.isEmpty()) {
String[] a = in.readLine().split(delimiter);
for (int i = 0; i < a.length; i++) {
if (!st.contains(a[i]))
st.put(a[i], st.size());
}
}
StdOut.println("Done reading " + filename);
// inverted index to get string keys in an aray
keys = new String[st.size()];
for (String name : st.keys()) {
keys[st.get(name)] = name;
}
// second pass builds the graph by connecting first vertex on each
// line to all others
G = new Graph(st.size());
in = new In(filename);
while (in.hasNextLine()) {
String[] a = in.readLine().split(delimiter);
int v = st.get(a[0]);
for (int i = 1; i < a.length; i++) {
int w = st.get(a[i]);
G.addEdge(v, w);
}
}
}
/**
* Does the graph contain the vertex named s ?
* @param s the name of a vertex
* @return true if s is the name of a vertex, and false otherwise
*/
public boolean contains(String s) {
return st.contains(s);
}
/**
* Returns the integer associated with the vertex named s .
* @param s the name of a vertex
* @return the integer (between 0 and V - 1) associated with the vertex named s
*/
public int index(String s) {
return st.get(s);
}
/**
* Returns the name of the vertex associated with the integer v .
* @param v the integer corresponding to a vertex (between 0 and V - 1)
* @return the name of the vertex associated with the integer v
*/
public String name(int v) {
return keys[v];
}
/**
* Returns the graph assoicated with the symbol graph. It is the client's responsibility
* not to mutate the graph.
* @return the graph associated with the symbol graph
*/
public Graph G() {
return G;
}
/**
* Unit tests the SymbolGraph data type.
*/
public static void main(String[] args) {
String filename = args[0];
String delimiter = args[1];
SymbolGraph sg = new SymbolGraph(filename, delimiter);
Graph G = sg.G();
while (StdIn.hasNextLine()) {
String source = StdIn.readLine();
if (sg.contains(source)) {
int s = sg.index(source);
for (int v : G.adj(s)) {
StdOut.println(" " + sg.name(v));
}
}
else {
StdOut.println("input not contain '" + source + "'");
}
}
}
}