latest version of the web app

hb2143 [2005-09-25 03:17:40]
latest version of the web app
Filename
config/content extractor settings.ini
config/hilabecker.ini
config/level13.ini
config/sb.ini
src/psl/crunch3/HttpStream.java
src/psl/crunch3/plugins/contentextractor/ContentExtractorSettings.java
src/psl/crunch3/web/LoginServlet.java
src/psl/crunch3/web/PresetServlet.java
src/psl/crunch3/web/RegisterBean.java
src/psl/crunch3/web/RegisterServlet.java
src/psl/crunch3/web/SettingsBean.java
src/psl/crunch3/web/SettingsServlet.java
src/psl/crunch3/web/Test.java
src/psl/crunch3/web/interface_files/crunch.css
src/psl/crunch3/web/interface_files/menu_r1_c1.gif
src/psl/crunch3/web/interface_files/menu_r1_c2.gif
src/psl/crunch3/web/interface_files/menu_r1_c3.gif
src/psl/crunch3/web/interface_files/menu_r1_c4.gif
src/psl/crunch3/web/interface_files/menu_r1_c5.gif
src/psl/crunch3/web/interface_files/spacer.gif
src/psl/crunch3/web/interface_files/title.png
users/abc1.ini
users/gabriela.ini
users/hila.ini
users/hila1.ini
users/hila123.ini
users/hila2.ini
users/hila3.ini
users/hila4.ini
users/hila5.ini
users/hilabecker.ini
users/null.ini
users/sb.ini
users/shlomo.ini
users/suhit.ini
users/test.ini
users/test1.ini
users/test12.ini
users/test2.ini
users/test3.ini
users/test4.ini
users/test83.ini
users/test88.ini
users/tester.ini
users/testing123.ini
users/yael.ini
diff --git a/config/content extractor settings.ini b/config/content extractor settings.ini
index da9e4b6..3a3b5a4 100644
--- a/config/content extractor settings.ini
+++ b/config/content extractor settings.ini
@@ -1,20 +1,20 @@
 #Content Extractor Settings File
-#Thu Aug 04 14:30:15 EDT 2005
+#Wed Sep 14 22:27:52 EDT 2005
 <A>\ tags\ are\ substance=true
 <FORM>\ tags\ are\ substance=true
-Ignore\ Image\ Links=false
+Ignore\ Image\ Links=true
 Ignore\ Meta\ Tags=true
 Display\ Image\ Link\ ALTs=true
-Ignore\ Text\ Links=false
+Ignore\ Text\ Links=true
 <INPUT>\ tags\ are\ substance=true
 Ignore\ <IFRAME>\ Tags=true
 <BUTTON>\ tags\ are\ substance=true
 Ignore\ All\ Advertisements=true
 <SELECT>\ tags\ are\ substance=true
-Ignore\ External\ Stylesheets=false
+Ignore\ External\ Stylesheets=true
 <IFRAME>\ tags\ are\ substance=true
 Ignore\ <EMBED>\ tags=true
-Ignore\ Styles=false
+Ignore\ Styles=true
 Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
 Ignore\ <INPUT>\ Tags=true
 Ignore\ Flash=true
@@ -22,21 +22,21 @@ Ignore\ Image\ Links\ in\ Link\ Lists=true
 <IMG>\ tags\ are\ substance=true
 <TEXTAREA>\ tags\ are\ substance=true
 Ignore\ Scripts=true
-Ignore\ Forms=false
+Ignore\ Forms=true
 Display\ Image\ ALTs=true
 Maximum\ Number\ of\ Line\ Breaks=2
-Ignore\ <BUTTON>\ Tags=false
+Ignore\ <BUTTON>\ Tags=true
 Limit\ Number\ of\ Line\ Breaks=false
-Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
 Ignore\ <NOSCRIPT>\ Tags=true
 Add\ removed\ links\ to\ bottom\ of\ the\ page=false
 Minimum\ text\ length\ as\ substance=12
-Remove\ Empty\ Tables=false
+Remove\ Empty\ Tables=true
 Ignore\ Text\ Links\ in\ Link\ Lists=true
 Ignore\ Table\ Cell\ Widths=true
-Ignore\ Style\ Attributes=false
+Ignore\ Style\ Attributes=true
 Ignore\ <SELECT>\ Tags=true
-Link/Text\ Removal\ Ratio=0.75
-Ignore\ Images=false
-Ignore\ Link\ Lists=false
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Ignore\ Link\ Lists=true
 Print\ Only\ Text=false
diff --git a/config/hilabecker.ini b/config/hilabecker.ini
deleted file mode 100644
index c7997f4..0000000
--- a/config/hilabecker.ini
+++ /dev/null
@@ -1,42 +0,0 @@
-#Content Extractor Settings File
-#Thu Feb 10 18:58:56 EST 2005
-<A>\ tags\ are\ substance=true
-<FORM>\ tags\ are\ substance=true
-Ignore\ Image\ Links=false
-Ignore\ Meta\ Tags=true
-Display\ Image\ Link\ ALTs=true
-Ignore\ Text\ Links=false
-<INPUT>\ tags\ are\ substance=true
-Ignore\ <IFRAME>\ Tags=true
-<BUTTON>\ tags\ are\ substance=true
-Ignore\ All\ Advertisements=true
-<SELECT>\ tags\ are\ substance=true
-Ignore\ External\ Stylesheets=false
-<IFRAME>\ tags\ are\ substance=true
-Ignore\ <EMBED>\ tags=true
-Ignore\ Styles=false
-Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
-Ignore\ <INPUT>\ Tags=true
-Ignore\ Flash=true
-Ignore\ Image\ Links\ in\ Link\ Lists=true
-<IMG>\ tags\ are\ substance=true
-<TEXTAREA>\ tags\ are\ substance=true
-Ignore\ Scripts=true
-Ignore\ Forms=false
-Display\ Image\ ALTs=true
-Maximum\ Number\ of\ Line\ Breaks=2
-Ignore\ <BUTTON>\ Tags=false
-Limit\ Number\ of\ Line\ Breaks=false
-Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
-Ignore\ <NOSCRIPT>\ Tags=true
-Add\ removed\ links\ to\ bottom\ of\ the\ page=false
-Minimum\ text\ length\ as\ substance=12
-Remove\ Empty\ Tables=false
-Ignore\ Text\ Links\ in\ Link\ Lists=true
-Ignore\ Table\ Cell\ Widths=true
-Ignore\ Style\ Attributes=false
-Ignore\ <SELECT>\ Tags=true
-Ignore\ Link\ Lists=false
-Link/Text\ Removal\ Ratio=0.75
-Ignore\ Images=false
-Print\ Only\ Text=false
diff --git a/config/level13.ini b/config/level13.ini
new file mode 100644
index 0000000..2f96204
--- /dev/null
+++ b/config/level13.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Tue Aug 16 12:10:16 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=false
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=false
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=false
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=false
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=false
+Ignore\ Flash=false
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=false
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=false
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=false
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=false
+Ignore\ Link\ Lists=false
+Ignore\ Images=false
+Link/Text\ Removal\ Ratio=0.3
+Print\ Only\ Text=false
diff --git a/config/sb.ini b/config/sb.ini
deleted file mode 100644
index c7997f4..0000000
--- a/config/sb.ini
+++ /dev/null
@@ -1,42 +0,0 @@
-#Content Extractor Settings File
-#Thu Feb 10 18:58:56 EST 2005
-<A>\ tags\ are\ substance=true
-<FORM>\ tags\ are\ substance=true
-Ignore\ Image\ Links=false
-Ignore\ Meta\ Tags=true
-Display\ Image\ Link\ ALTs=true
-Ignore\ Text\ Links=false
-<INPUT>\ tags\ are\ substance=true
-Ignore\ <IFRAME>\ Tags=true
-<BUTTON>\ tags\ are\ substance=true
-Ignore\ All\ Advertisements=true
-<SELECT>\ tags\ are\ substance=true
-Ignore\ External\ Stylesheets=false
-<IFRAME>\ tags\ are\ substance=true
-Ignore\ <EMBED>\ tags=true
-Ignore\ Styles=false
-Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
-Ignore\ <INPUT>\ Tags=true
-Ignore\ Flash=true
-Ignore\ Image\ Links\ in\ Link\ Lists=true
-<IMG>\ tags\ are\ substance=true
-<TEXTAREA>\ tags\ are\ substance=true
-Ignore\ Scripts=true
-Ignore\ Forms=false
-Display\ Image\ ALTs=true
-Maximum\ Number\ of\ Line\ Breaks=2
-Ignore\ <BUTTON>\ Tags=false
-Limit\ Number\ of\ Line\ Breaks=false
-Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
-Ignore\ <NOSCRIPT>\ Tags=true
-Add\ removed\ links\ to\ bottom\ of\ the\ page=false
-Minimum\ text\ length\ as\ substance=12
-Remove\ Empty\ Tables=false
-Ignore\ Text\ Links\ in\ Link\ Lists=true
-Ignore\ Table\ Cell\ Widths=true
-Ignore\ Style\ Attributes=false
-Ignore\ <SELECT>\ Tags=true
-Ignore\ Link\ Lists=false
-Link/Text\ Removal\ Ratio=0.75
-Ignore\ Images=false
-Print\ Only\ Text=false
diff --git a/src/psl/crunch3/HttpStream.java b/src/psl/crunch3/HttpStream.java
index b1f026d..8a1cd31 100644
--- a/src/psl/crunch3/HttpStream.java
+++ b/src/psl/crunch3/HttpStream.java
@@ -31,6 +31,7 @@ public class HttpStream extends Thread {
 	private static final char LF = '\n';
 	private static final String CRLF = "\r\n";
 	private static final int BUFFER_SIZE = 16384;
+

 	private static final String[] STATUS_STRINGS = { "0. Initializing", //0
 		"1. Reading Client First Line", //1
@@ -46,7 +47,9 @@ public class HttpStream extends Thread {
 	};

 	private int soTimeout = Crunch3.settings.getSocketTimeout();
-
+
+	private boolean isCrunchPage = false;
+
 	Socket clientSocket;
 	HttpMetadata clientMetadata = new HttpMetadata(HttpMetadata.CLIENT);

@@ -126,7 +129,23 @@ public class HttpStream extends Thread {

 		// try to read the first line from the client
 		try {
-			clientMetadata.setFirstLine(readLine(clientSocket.getInputStream()));
+			String get = readLine(clientSocket.getInputStream());
+			clientMetadata.setFirstLine(get);
+
+			if(get.contains("rector.psl.cs.columbia.edu/crunch")){
+				//Crunch3.mainControl.loadFile("config"+ File.separator +"level13.ini");
+				if(get.contains("rector.psl.cs.columbia.edu/crunch/register.htm") || get.contains("rector.psl.cs.columbia.edu/crunch/slogin.html")
+						|| get.contains("rector.psl.cs.columbia.edu/crunch/Register.jsp") || get.contains("rector.psl.cs.columbia.edu/crunch/login.htm")){
+				int start = get.lastIndexOf("HTTP");
+				get = get.substring(0,start-1) + "?ip=" + clientSocket.getInetAddress() + " " + get.substring(start);
+
+				clientMetadata.setFirstLine(get);
+				}
+				isCrunchPage = true;
+			}
+			else{
+				isCrunchPage = false;
+			}
 		} catch (IOException ioe) {
 			// shutdown on an error
 			if (Crunch3.settings.isVerbose())
@@ -317,6 +336,8 @@ public class HttpStream extends Thread {
 		// only filter if not homepage or filter homepages turned on
 		shouldFilter = shouldFilter && (Crunch3.settings.isFilterHomepages() || !isHomepage());

+		//only filter if not crunch page
+		shouldFilter = shouldFilter && !isCrunchPage;
 		if (shouldFilter)
 			contentFile = filter();

@@ -641,22 +662,24 @@ public class HttpStream extends Thread {
     		System.out.println("changing settings");
     		System.out.println();
     	}
-		System.out.println("********************working working");
+

 		if(con != null){
 			try{
-				System.out.println("**********");
+
 				stmt = con.createStatement();

 	            stmt.execute("select user from connected where ip='" + clientSocket.getInetAddress() + "'");

+	            System.out.println(clientSocket.getInetAddress());
 	            rs= stmt.getResultSet();
 	            if(!rs.next()){
 	            	//load default settings
+	            	System.out.println("problem \n");
 	            }
 	            else{
 	            	String username=rs.getString(1);
-	            	Crunch3.mainControl.loadFile("config" +File.separator+ username+".ini");
+	            	Crunch3.mainControl.loadFile("users" +File.separator+ username+".ini");
 	            	if (Crunch3.settings.isVerbose()){
 	            		System.out.println("settings file loaded for user " + username);
 	            	}
diff --git a/src/psl/crunch3/plugins/contentextractor/ContentExtractorSettings.java b/src/psl/crunch3/plugins/contentextractor/ContentExtractorSettings.java
index 4718479..c06e16a 100644
--- a/src/psl/crunch3/plugins/contentextractor/ContentExtractorSettings.java
+++ b/src/psl/crunch3/plugins/contentextractor/ContentExtractorSettings.java
@@ -96,6 +96,12 @@ public class ContentExtractorSettings implements ContentExtractorConstants {
 		loadSettings();
 	}

+	public void changeFile(String f){
+		mSettingsFile = f;
+		loadSettingsProperties();
+		loadSettings();
+	}
+
 	/**
 	 * Returns a setting based on the final variables
 	 *
diff --git a/src/psl/crunch3/web/LoginServlet.java b/src/psl/crunch3/web/LoginServlet.java
index 8bb9a79..96882e5 100644
--- a/src/psl/crunch3/web/LoginServlet.java
+++ b/src/psl/crunch3/web/LoginServlet.java
@@ -24,22 +24,48 @@ public class LoginServlet extends HttpServlet{
 			s.setAttribute("lb", lb);
 		}

+		boolean done = false;
+
+
+		if((request.getParameter("reset")).equals("true")){
+
+			done =(lb.resetPassword(request.getParameter("username"),request.getParameter("lastname"),request.getParameter("password")));
+
+
+		}
+
+
+
 		lb.setUsername((request.getParameter("username")));
 	    lb.setPassword((request.getParameter("password")));

 			Cookie c = new Cookie("crunch", lb.getUsername());
-        	InetAddress remoteInetAddress = InetAddress.getByName(request.getRemoteAddr());
+        	InetAddress remoteInetAddress = InetAddress.getByName(request.getRemoteAddr());
+        	if((remoteInetAddress.toString()).equals("/128.59.14.166")){
+        		remoteInetAddress = InetAddress.getByName(((request.getParameter("ip")).substring(1)));
+        	}
         if(lb.authenticate(remoteInetAddress)){
         	lb.login(remoteInetAddress);
         	response.addCookie(c);
+
+        	HttpSession session = (request.getSession(true));
+        	session.setAttribute("name",lb.getUsername());
+
 			RequestDispatcher r = getServletContext().getRequestDispatcher(
-	          "/interface.htm");
+	          "/presets.html");
 	        r.forward(request, response);
 		}
 		else{
-			RequestDispatcher r = getServletContext().getRequestDispatcher(
-	          "/login.htm");
-	        r.forward(request, response);
+			if((request.getParameter("reset")).equals("true")){
+				RequestDispatcher r = getServletContext().getRequestDispatcher(
+		          "/tryagain.html");
+		        r.forward(request, response);
+			}
+			else{
+				RequestDispatcher r = getServletContext().getRequestDispatcher(
+				"/login.htm");
+	        	r.forward(request, response);
+			}
 		}

 	}
@@ -50,4 +76,6 @@ public class LoginServlet extends HttpServlet{
 	  }


+
+
 }
diff --git a/src/psl/crunch3/web/PresetServlet.java b/src/psl/crunch3/web/PresetServlet.java
new file mode 100644
index 0000000..6148172
--- /dev/null
+++ b/src/psl/crunch3/web/PresetServlet.java
@@ -0,0 +1,125 @@
+package psl.crunch3.web;
+
+import javax.servlet.*;
+import javax.servlet.http.*;
+
+import psl.crunch3.plugins.contentextractor.ContentExtractor;
+
+
+import java.io.*;
+
+
+public class PresetServlet extends HttpServlet{
+
+	public void doGet(HttpServletRequest request, HttpServletResponse response)
+    throws ServletException, IOException {
+
+		String choice = request.getParameter("preset");
+		Cookie[] cookies = request.getCookies();
+		String username=null;
+
+		if(cookies !=null){
+			for(int i=0;i<cookies.length;i++){
+				if ((cookies[i].getName()).equals("crunch")){
+					username = cookies[i].getValue();
+					break;
+				}
+			}
+		}
+
+		if(username==null){
+			RequestDispatcher r = getServletContext().getRequestDispatcher(
+	          "/login.htm");
+	        r.forward(request, response);
+		}
+		else if(choice.equals("custom")){
+			RequestDispatcher r = getServletContext().getRequestDispatcher(
+	          "/interface.jsp");
+	        r.forward(request, response);
+
+		}
+		else {
+
+
+			if(choice.equals("shopping")){
+
+				copy(username, ContentExtractor.LEVEL7_SETTINGS_FILE_DEF );
+			}
+		else if(choice.equals("news")){
+			copy(username, ContentExtractor.LEVEL2_SETTINGS_FILE_DEF );
+		}
+		else if(choice.equals("textheavy")){
+
+			copy(username, ContentExtractor.LEVEL2_SETTINGS_FILE_DEF );
+		}
+		else if(choice.equals("linkheavy")){
+
+			copy(username, ContentExtractor.LEVEL10_SETTINGS_FILE_DEF );
+		}
+		else if(choice.equals("government")){
+
+			copy(username, ContentExtractor.LEVEL5_SETTINGS_FILE_DEF );
+		}
+		else if(choice.equals("education")){
+
+			copy(username, ContentExtractor.LEVEL6_SETTINGS_FILE_DEF );
+		}
+		else{
+			copy(username, ContentExtractor.LEVEL11_SETTINGS_FILE_DEF );
+		}
+
+			RequestDispatcher r = getServletContext().getRequestDispatcher(
+	          "/presets.html");
+	        r.forward(request, response);
+
+
+	}
+
+
+
+
+
+
+
+	}
+
+
+
+	  //Process the HTTP Post request
+	  public void doPost(HttpServletRequest request, HttpServletResponse response)
+	      throws ServletException, IOException {
+	    doGet(request, response);
+	  }
+
+
+
+
+
+
+	  private boolean copy(String tof, String fromf){
+
+		  try{
+				 File fromFile = new File("/home/hila/eclipse/workspace/crunch3/" + fromf);
+				 File toFile = new File("/home/hila/eclipse/workspace/crunch3/users/" + tof + ".ini");
+
+				 FileInputStream from = new FileInputStream(fromFile);
+				 FileOutputStream to = new FileOutputStream(toFile);
+
+				 byte[] buff = new byte[4096];
+				 int i;
+
+				 while ((i = from.read(buff))!=-1){
+					 to.write(buff, 0,i);
+				 }
+				 from.close();
+				 to.close();
+				 return true;
+			 }
+			 catch(Exception e){
+				 return false;
+			 }
+
+
+
+	  }
+}
diff --git a/src/psl/crunch3/web/RegisterBean.java b/src/psl/crunch3/web/RegisterBean.java
index b2b36c2..3dd87eb 100644
--- a/src/psl/crunch3/web/RegisterBean.java
+++ b/src/psl/crunch3/web/RegisterBean.java
@@ -5,6 +5,8 @@ import java.net.InetAddress;
 import java.security.*;
 import java.sql.*;

+import javax.servlet.RequestDispatcher;
+
 public class RegisterBean implements Serializable{

 	private String firstName, lastName, email;
@@ -211,8 +213,8 @@ public class RegisterBean implements Serializable{
 	            stmt = conn.createStatement();

 	            stmt.execute("insert into user values ('" + username + "' , '"+
-	            		firstName + "' , '"+ lastName + "' , '"+ email + "' , '"+
-	            		encrypt(password) + "')");
+	            		firstName + "' , '"+ lastName + "' , '"+ email + "' , "+
+	            		"MD5('" +password +"' ) )");
 	            inserted="true";
 	            return true;

@@ -302,6 +304,8 @@ public class RegisterBean implements Serializable{
 		 Statement stmt = null;
 		 ResultSet rs = null;

+		 boolean result=true;
+
 		 try {


@@ -310,18 +314,15 @@ public class RegisterBean implements Serializable{

 	            stmt = conn.createStatement();

-	            stmt.execute("select password from user where username='" + username +  "'");
+	            stmt.execute("select username from user where username='" + username + "' and password=MD5('"+ password + "')");
 	            rs = stmt.getResultSet();

 	            if(!rs.next()){
-	            	return false;
-	            }
-	            else{
-	            	if( !(rs.getString(1)).equals(password))
-	            		return false;
+	            	result= false;
 	            }


+
 	            //remove row from connected table
 	            stmt = conn.createStatement();

@@ -336,7 +337,7 @@ public class RegisterBean implements Serializable{

 	     }
 		 catch (Exception ex) {
-			 return false;
+			 result= false;
 	     }
 		 finally {

@@ -351,15 +352,16 @@ public class RegisterBean implements Serializable{
 			}

 		}
-		 return true;
+		 return result;


 	 }

-	 public boolean login(InetAddress address){
+	 public String login(InetAddress address){

 		 Statement stmt = null;

+		 String result = "true";
 			 try {


@@ -370,15 +372,10 @@ public class RegisterBean implements Serializable{

 		            stmt.execute("insert into connected values ('" + username + "' , '"+
 		            		address + "')");
-
-
-
-
-

 		     }
 			 catch (Exception ex) {
-				 return false;
+				 result = ex.getMessage();
 		     }
 			 finally {

@@ -393,6 +390,73 @@ public class RegisterBean implements Serializable{
 				}

 			}
+			 return result;
+	 }
+
+
+	 /**
+	  * Creates a new settings file where the user's preferred settings
+	  * would be stored. The default file settings would be the same as config/level6.ini
+	  */
+	 public boolean createUserPrefFile(){
+
+		 try{
+			 File fromFile = new File("/home/hila/eclipse/workspace/crunch3/config/level6.ini");
+			 File toFile = new File("/home/hila/eclipse/workspace/crunch3/users/" + username + ".ini");
+
+			 FileInputStream from = new FileInputStream(fromFile);
+			 FileOutputStream to = new FileOutputStream(toFile);
+
+			 byte[] buff = new byte[4096];
+			 int i;
+
+			 while ((i = from.read(buff))!=-1){
+				 to.write(buff, 0,i);
+			 }
+			 from.close();
+			 to.close();
 			 return true;
+		 }
+		 catch(Exception e){
+			 return false;
+		 }
+
+
 	 }
+
+	 public boolean resetPassword(String userName, String lastName, String pass){
+		 Statement stmt = null;
+
+		 boolean result =true;
+			 try {
+
+				   if(conn==null) connect();
+
+		            stmt = conn.createStatement();
+
+		            stmt.execute("update user set password=MD5('"+ pass + "') where username = '" +userName + "' and "+
+		            		"lastname = '" + lastName + "'");
+
+		     }
+			 catch (Exception ex) {
+				 result = false;
+		     }
+			 finally {
+
+
+				    if (stmt != null) {
+				        try {
+				            stmt.close();
+				        } catch (SQLException sqlEx) { // ignore }
+
+				        stmt = null;
+				    }
+				}
+
+			}
+			 return result;
+	 }
+
+
+
 }
diff --git a/src/psl/crunch3/web/RegisterServlet.java b/src/psl/crunch3/web/RegisterServlet.java
index 79bc4a4..fbeb520 100644
--- a/src/psl/crunch3/web/RegisterServlet.java
+++ b/src/psl/crunch3/web/RegisterServlet.java
@@ -62,12 +62,25 @@ public class RegisterServlet extends HttpServlet{
 	        if(rb.writeToDB()){

 	        	Cookie c = new Cookie("crunch", rb.getUsername());
-	        	InetAddress remoteInetAddress = InetAddress.getByName(request.getRemoteAddr());
-	        	rb.login(remoteInetAddress);
-	        	response.addCookie(c);
-	        	RequestDispatcher r = getServletContext().getRequestDispatcher(
-		          "/success.jsp");
-		        r.forward(request, response);
+	        	InetAddress remoteInetAddress = InetAddress.getByName(request.getRemoteAddr());
+	        	if((remoteInetAddress.toString()).equals("/128.59.14.166")){
+	        		remoteInetAddress = InetAddress.getByName(((request.getParameter("ip")).substring(1)));
+	        	}
+	        	rb.createUserPrefFile();
+	        	rb.authenticate(remoteInetAddress);
+	        	String s1 = rb.login(remoteInetAddress);
+	        	if(s1.equals("true")){
+	        		response.addCookie(c);
+	        		HttpSession session = (request.getSession(true));
+	        		session.setAttribute("name",rb.getUsername());
+	        		RequestDispatcher r = getServletContext().getRequestDispatcher(
+	        			"/presets.html");
+	        		r.forward(request, response);
+	        	}
+	        	else{
+	        		RequestDispatcher r = getServletContext().getRequestDispatcher("/Register.jsp");
+	        		r.forward(request, response);
+	        	}
 	        }
 	        else {RequestDispatcher r = getServletContext().getRequestDispatcher(
 	          "/Register.jsp");
diff --git a/src/psl/crunch3/web/SettingsBean.java b/src/psl/crunch3/web/SettingsBean.java
index d403198..dd499db 100644
--- a/src/psl/crunch3/web/SettingsBean.java
+++ b/src/psl/crunch3/web/SettingsBean.java
@@ -3,14 +3,18 @@ package psl.crunch3.web;
 import java.io.Serializable;

 import org.eclipse.swt.SWT;
+import org.eclipse.swt.events.SelectionEvent;
 import org.eclipse.swt.widgets.Button;
 import org.eclipse.swt.widgets.Composite;
+import org.eclipse.swt.widgets.Event;
 import org.eclipse.swt.widgets.Group;
 import org.eclipse.swt.widgets.Label;
 import org.eclipse.swt.widgets.Sash;
 import org.eclipse.swt.widgets.TabItem;
 import org.eclipse.swt.widgets.Text;

+import java.io.*;
+
 import psl.crunch3.Crunch3;
 import psl.crunch3.plugins.contentextractor.ContentExtractorConstants;
 import psl.crunch3.plugins.contentextractor.ContentExtractorSettings;
@@ -63,6 +67,7 @@ public class SettingsBean implements Serializable {
 	private boolean limitLineBreaks;
 	private int	maxLineBreaks;

+	private String username; //only registered users can change crunch settings

 	private ContentExtractorSettings mFilter;

@@ -72,6 +77,9 @@ public class SettingsBean implements Serializable {
 	}


+	public void setUsername(String name){
+		username = name;
+	}


 	public void setAppendLinks(String appendLinks) {
@@ -442,6 +450,10 @@ public class SettingsBean implements Serializable {
 	 * GET methods
 	 *************************************************************/

+	public String getUsername(){
+		return username;
+	}
+
 	public String getAppendLinks() {
 		return Boolean.toString(appendLinks);
 	}
@@ -652,8 +664,8 @@ public class SettingsBean implements Serializable {
 		mFilter.changeSetting(ContentExtractorConstants.IGNORE_STYLES, Boolean.toString(ignoreStyles));
 		mFilter.changeSetting(ContentExtractorConstants.IGNORE_CELL_WIDTH, Boolean.toString(ignoreTableCellWidths));

+		mFilter.changeSetting(ContentExtractorConstants.REMOVE_EMPTY_TABLES, Boolean.toString(removeEmptyTables));
 		if (removeEmptyTables) {
-			mFilter.changeSetting(ContentExtractorConstants.REMOVE_EMPTY_TABLES, Boolean.toString(removeEmptyTables));
 			mFilter.changeSetting(ContentExtractorConstants.SUBSTANCE_BUTTON, Boolean.toString(substanceButton));
 			mFilter.changeSetting(ContentExtractorConstants.SUBSTANCE_FORM, Boolean.toString(substanceForm));
 			mFilter.changeSetting(ContentExtractorConstants.SUBSTANCE_IFRAME, Boolean.toString(substanceIFrame));
@@ -664,8 +676,7 @@ public class SettingsBean implements Serializable {
 			mFilter.changeSetting(ContentExtractorConstants.SUBSTANCE_TEXTAREA, Boolean.toString(substanceTextarea));
 			mFilter.changeSetting(ContentExtractorConstants.SUBSTANCE_MIN_TEXT_LENGTH, Integer.toString(minimumTextLength));
 		} //if
-		else
-			mFilter.changeSetting(ContentExtractorConstants.REMOVE_EMPTY_TABLES, Boolean.toString(removeEmptyTables));
+

 		mFilter.changeSetting(ContentExtractorConstants.IGNORE_EMBED_TAGS, Boolean.toString(ignoreEmbed));
 		mFilter.changeSetting(ContentExtractorConstants.IGNORE_FLASH, Boolean.toString(ignoreFlash));
@@ -676,11 +687,63 @@ public class SettingsBean implements Serializable {



-		 mFilter.save("/eclipse/workspace/crunch3/config/content.ini");
-		 if(Crunch3.mainControl != null)
-		 Crunch3.mainControl.loadFile("/eclipse/workspace/crunch3/config/content.ini");
-		//return mFilter.getSetting(ContentExtractorConstants.LINK_TEXT_REMOVAL_RATIO);
+		 mFilter.save("/home/hila/eclipse/workspace/crunch3/users/" + username +".ini");
+

 	}

+
+	public void loadUserSettings(String user){
+
+		if(user !=null){
+
+		mFilter = ContentExtractorSettings.getInstance();
+		mFilter.changeFile("/home/hila/eclipse/workspace/crunch3/users/" + user +".ini");
+
+
+		ignoreAds = (mFilter.getSetting(ContentExtractorConstants.IGNORE_ADS).equals("true"));
+		ignoreScripts = (mFilter.getSetting(ContentExtractorConstants.IGNORE_SCRIPTS).equals("true"));
+		ignoreNoscript=(mFilter.getSetting(ContentExtractorConstants.IGNORE_NOSCRIPT_TAGS).equals("true"));
+		ignoreExternalStylesheets=(mFilter.getSetting(ContentExtractorConstants.IGNORE_EXTERNAL_STYLESHEETS).equals("true"));
+		ignoreStyles=(mFilter.getSetting(ContentExtractorConstants.IGNORE_STYLES).equals("true"));
+		ignoreStyleAttributes=(mFilter.getSetting(ContentExtractorConstants.IGNORE_STYLE_ATTRIBUTES).equals("true"));
+		ignoreStyleInDiv=(mFilter.getSetting(ContentExtractorConstants.IGNORE_DIV_STYLES).equals("true"));
+	    ignoreImages=(mFilter.getSetting(ContentExtractorConstants.IGNORE_IMAGES).equals("true"));
+		displayAltTags = (mFilter.getSetting(ContentExtractorConstants.DISPLAY_IMAGE_ALTS).equals("true"));
+		ignoreImageLinks=(mFilter.getSetting(ContentExtractorConstants.IGNORE_IMAGE_LINKS).equals("true"));
+		displayImageLinkAlts=(mFilter.getSetting(ContentExtractorConstants.DISPLAY_IMAGE_LINK_ALTS).equals("true"));
+		ignoreTextLinks=(mFilter.getSetting(ContentExtractorConstants.IGNORE_TEXT_LINKS).equals("true"));
+		ignoreForms=(mFilter.getSetting(ContentExtractorConstants.IGNORE_FORMS).equals("true"));
+		ignoreInput=(mFilter.getSetting(ContentExtractorConstants.IGNORE_INPUT_TAGS).equals("true"));
+		ignoreButton=(mFilter.getSetting(ContentExtractorConstants.IGNORE_BUTTON_TAGS).equals("true"));
+		ignoreSelect=(mFilter.getSetting(ContentExtractorConstants.IGNORE_SELECT_TAGS).equals("true"));
+		ignoreMeta=(mFilter.getSetting(ContentExtractorConstants.IGNORE_META).equals("true"));
+		ignoreIframe=(mFilter.getSetting(ContentExtractorConstants.IGNORE_IFRAME_TAGS).equals("true"));
+		ignoreTableCellWidths=(mFilter.getSetting(ContentExtractorConstants.IGNORE_CELL_WIDTH).equals("true"));
+		ignoreEmbed=(mFilter.getSetting(ContentExtractorConstants.IGNORE_EMBED_TAGS).equals("true"));
+		ignoreFlash=(mFilter.getSetting(ContentExtractorConstants.IGNORE_FLASH).equals("true"));
+		ignoreLinkLists=(mFilter.getSetting(ContentExtractorConstants.IGNORE_LINK_CELLS).equals("true"));
+
+		ignoreLLTextLinks=(mFilter.getSetting(ContentExtractorConstants.LC_IGNORE_TEXT_LINKS).equals("true"));
+		ignoreLLImageLinks=(mFilter.getSetting(ContentExtractorConstants.LC_IGNORE_IMAGE_LINKS).equals("true"));
+		ignoreOnlyTextAndLinks=(mFilter.getSetting(ContentExtractorConstants.LC_ONLY_LINKS_AND_TEXT).equals("true"));
+		linkTextRatio=Double.parseDouble(mFilter.getSetting(ContentExtractorConstants.LINK_TEXT_REMOVAL_RATIO));
+		removeEmptyTables=(mFilter.getSetting(ContentExtractorConstants.REMOVE_EMPTY_TABLES).equals("true"));
+		substanceImage=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_IMAGE).equals("true"));
+		substanceTextarea=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_TEXTAREA).equals("true"));
+		substanceLinks=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_LINKS).equals("true"));
+		substanceButton=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_BUTTON).equals("true"));
+		substanceInput=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_INPUT).equals("true"));
+		substanceForm=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_FORM).equals("true"));
+		substanceSelect=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_SELECT).equals("true"));
+		substanceIFrame=(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_IFRAME).equals("true"));
+		minimumTextLength = Integer.parseInt(mFilter.getSetting(ContentExtractorConstants.SUBSTANCE_MIN_TEXT_LENGTH));
+        htmlOutput= (!mFilter.getSetting(ContentExtractorConstants.ONLY_TEXT).equals("true"));
+		textOutput=(mFilter.getSetting(ContentExtractorConstants.ONLY_TEXT).equals("true"));
+		appendLinks=(mFilter.getSetting(ContentExtractorConstants.ADD_LINKS_TO_BOTTOM).equals("true"));
+		limitLineBreaks=(mFilter.getSetting(ContentExtractorConstants.LIMIT_LINEBREAKS).equals("true"));
+		maxLineBreaks=Integer.parseInt(mFilter.getSetting(ContentExtractorConstants.MAX_LINEBREAKS));
+		}
+	}
+
 }
diff --git a/src/psl/crunch3/web/SettingsServlet.java b/src/psl/crunch3/web/SettingsServlet.java
index a378609..7acaa00 100644
--- a/src/psl/crunch3/web/SettingsServlet.java
+++ b/src/psl/crunch3/web/SettingsServlet.java
@@ -2,6 +2,7 @@ package psl.crunch3.web;

 import javax.servlet.*;
 import javax.servlet.http.*;
+
 import java.io.*;

 public class SettingsServlet extends HttpServlet {
@@ -77,24 +78,36 @@ public class SettingsServlet extends HttpServlet {
      b.setIgnoreFlash((request.getParameter("ignoreFlash")));


-
-     b.commitSettings();
-
-
-    response.setContentType(CONTENT_TYPE);
-
-    PrintWriter out = response.getWriter();
-    out.println(DOC_TYPE);
-    out.println("<html>");
-    out.println("<head> <title>test test</title> </head>");
-    out.println("<body> <H2> " + "Changes Submitted" + "</H2> </body></html>");
-
+     Cookie[] cookies = request.getCookies();
+
+     //   if no cookies were found, the user isn't logged in, redirect to login page
+     if(cookies == null){
+    	 RequestDispatcher r = getServletContext().getRequestDispatcher(
+         "/login.htm");
+    	 r.forward(request, response);
+     }
+     else{
+    	 for (int i=0; i<cookies.length;i++){
+    		 if (((cookies[i]).getName()).equals("crunch")){
+    		 	b.setUsername((cookies[i]).getValue());
+    		 	break;
+    		 }
+    	 }
+
+
+
+
+    	 b.commitSettings();
+    	 HttpSession session = (request.getSession(true));
+      	 session.setAttribute("name",b.getUsername());
+    	 RequestDispatcher r = getServletContext().getRequestDispatcher(
+         "/interface.jsp");
+    	 r.forward(request, response);
+     }


-    /**  RequestDispatcher r = getServletContext().getRequestDispatcher(
-          "/Form.jsp");
-      r.forward(request, response);
-**/
+
+



diff --git a/src/psl/crunch3/web/Test.java b/src/psl/crunch3/web/Test.java
index 16364d1..bc581aa 100644
--- a/src/psl/crunch3/web/Test.java
+++ b/src/psl/crunch3/web/Test.java
@@ -1,5 +1,8 @@
 package psl.crunch3.web;

+import java.io.File;
+import java.io.FileInputStream;
+import java.io.FileOutputStream;
 import java.sql.Connection;
 import java.sql.DriverManager;
 import java.sql.ResultSet;
@@ -40,6 +43,23 @@ public class Test {
 	            System.out.println(str);
 	            stmt.execute(str);
 	            System.out.println("point 4");
+
+
+	            File fromFile = new File("config" + File.separator +  "level6.ini");
+				 File toFile = new File("users" + File.separator + "test" + ".ini");
+
+				 FileInputStream from = new FileInputStream(fromFile);
+				 FileOutputStream to = new FileOutputStream(toFile);
+
+				 byte[] buff = new byte[4096];
+				 int i;
+
+				 while ((i = from.read(buff))!=-1){
+					 to.write(buff, 0,i);
+				 }
+				 from.close();
+				 to.close();
+

 	     }
 		 catch (Exception ex) {
@@ -74,4 +94,29 @@ public class Test {

 	}

+	/** Copies config/level6.ini over users/test.ini; any failure is printed, not rethrown. */
+	public void createUserPrefFile(){
+		 File fromFile = new File("config" + File.separator +  "level6.ini");
+		 File toFile = new File("users" + File.separator + "test" + ".ini");
+		 FileInputStream from = null;
+		 FileOutputStream to = null;
+		 try{
+			 from = new FileInputStream(fromFile);
+			 to = new FileOutputStream(toFile);
+			 byte[] buff = new byte[4096];
+			 int i;
+			 while ((i = from.read(buff))!=-1){
+				 to.write(buff, 0,i);
+			 }
+		 } catch(Exception e){
+			 e.printStackTrace();
+		 }
+		 finally{
+			 // Close each stream independently so a failed open/copy/close never leaks the other handle.
+			 try{ if (from != null) from.close(); } catch(Exception e){ e.printStackTrace(); }
+			 try{ if (to != null) to.close(); } catch(Exception e){ e.printStackTrace(); }
+		 }
+	}
+
+
 }
diff --git a/src/psl/crunch3/web/interface_files/crunch.css b/src/psl/crunch3/web/interface_files/crunch.css
deleted file mode 100644
index 9132c34..0000000
--- a/src/psl/crunch3/web/interface_files/crunch.css
+++ /dev/null
@@ -1,60 +0,0 @@
-BODY {
-	BACKGROUND-COLOR: #84939a; TEXT-ALIGN: center
-}
-DIV#wrapper {
-	WIDTH: 740px; TEXT-ALIGN: left; align: center
-}
-DIV#main {
-	WIDTH: 740px; HEIGHT: 800px; BACKGROUND-COLOR: white
-}
-A:link {
-	FONT-WEIGHT: bold; COLOR: black; TEXT-DECORATION: none
-}
-A:visited {
-	FONT-WEIGHT: bold; COLOR: black; TEXT-DECORATION: none
-}
-A:hover {
-	COLOR: #fdc255
-}
-.box {
-	PADDING-RIGHT: 12px; PADDING-LEFT: 0px; BACKGROUND: url(borders.gif) #84939a repeat-y 100% 0px; PADDING-BOTTOM: 0px; PADDING-TOP: 0px
-}
-.bi {
-	PADDING-RIGHT: 0px; PADDING-LEFT: 12px; BACKGROUND: url(borders.gif) #fff repeat-y 0px 0px; PADDING-BOTTOM: 0px; PADDING-TOP: 0px
-}
-.bt {
-	BACKGROUND: url(box2.gif) no-repeat 100% 0px; MARGIN: 0px -12px; HEIGHT: 17px
-}
-.bt DIV {
-	BACKGROUND: url(box2.gif) no-repeat 0px 0px; WIDTH: 18px; HEIGHT: 17px
-}
-.bb {
-	BACKGROUND: url(box2.gif) no-repeat 100% 100%; MARGIN: 0px -12px; HEIGHT: 17px
-}
-.bb DIV {
-	BACKGROUND: url(box2.gif) no-repeat 0px 100%; WIDTH: 18px; HEIGHT: 17px
-}
-.box H1 {
-	PADDING-RIGHT: 10px; PADDING-LEFT: 10px; BACKGROUND: #fdc255; PADDING-BOTTOM: 0.3em; MARGIN: 0px; FONT: bold 1.2em/1 Arial, Helvetica, sans-serif; PADDING-TOP: 0.3em
-}
-.box P {
-	PADDING-RIGHT: 10px; PADDING-LEFT: 10px; BACKGROUND: #fff; PADDING-BOTTOM: 4px; MARGIN: 0px; PADDING-TOP: 4px
-}
-.box UL {
-	PADDING-RIGHT: 10px; PADDING-LEFT: 10px; BACKGROUND: #fff; PADDING-BOTTOM: 4px; MARGIN: 0px; PADDING-TOP: 4px
-}
-.box TABLE {
-	PADDING-RIGHT: 10px; PADDING-LEFT: 10px; BACKGROUND: #fff; PADDING-BOTTOM: 4px; MARGIN: 0px; PADDING-TOP: 4px
-}
-.box FORM {
-	PADDING-RIGHT: 10px; PADDING-LEFT: 10px; BACKGROUND: #fff; PADDING-BOTTOM: 4px; MARGIN: 0px; PADDING-TOP: 4px
-}
-.box LI {
-	PADDING-RIGHT: 20px; PADDING-LEFT: 20px; BACKGROUND: #fff; PADDING-BOTTOM: 20px; MARGIN: 0px 0px 0px 2em; PADDING-TOP: 20px
-}
-.box IMG {
-	BACKGROUND: #fff
-}
-TD.settd {
-	WIDTH: 50%; HEIGHT: 20px
-}
diff --git a/src/psl/crunch3/web/interface_files/menu_r1_c1.gif b/src/psl/crunch3/web/interface_files/menu_r1_c1.gif
deleted file mode 100644
index 71671f4..0000000
Binary files a/src/psl/crunch3/web/interface_files/menu_r1_c1.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/menu_r1_c2.gif b/src/psl/crunch3/web/interface_files/menu_r1_c2.gif
deleted file mode 100644
index 535716b..0000000
Binary files a/src/psl/crunch3/web/interface_files/menu_r1_c2.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/menu_r1_c3.gif b/src/psl/crunch3/web/interface_files/menu_r1_c3.gif
deleted file mode 100644
index 306beea..0000000
Binary files a/src/psl/crunch3/web/interface_files/menu_r1_c3.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/menu_r1_c4.gif b/src/psl/crunch3/web/interface_files/menu_r1_c4.gif
deleted file mode 100644
index b379212..0000000
Binary files a/src/psl/crunch3/web/interface_files/menu_r1_c4.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/menu_r1_c5.gif b/src/psl/crunch3/web/interface_files/menu_r1_c5.gif
deleted file mode 100644
index 93e7af1..0000000
Binary files a/src/psl/crunch3/web/interface_files/menu_r1_c5.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/spacer.gif b/src/psl/crunch3/web/interface_files/spacer.gif
deleted file mode 100644
index fc25609..0000000
Binary files a/src/psl/crunch3/web/interface_files/spacer.gif and /dev/null differ
diff --git a/src/psl/crunch3/web/interface_files/title.png b/src/psl/crunch3/web/interface_files/title.png
deleted file mode 100644
index 7d7723c..0000000
Binary files a/src/psl/crunch3/web/interface_files/title.png and /dev/null differ
diff --git a/users/abc1.ini b/users/abc1.ini
new file mode 100644
index 0000000..a221eaf
--- /dev/null
+++ b/users/abc1.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:49:45 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Print\ Only\ Text=false
diff --git a/users/gabriela.ini b/users/gabriela.ini
new file mode 100644
index 0000000..0d44aa1
--- /dev/null
+++ b/users/gabriela.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Aug 11 11:59:24 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=false
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=false
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=false
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=false
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=false
+Ignore\ Flash=false
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=false
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=false
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=false
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=false
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=false
+Ignore\ Link\ Lists=false
+Print\ Only\ Text=false
diff --git a/users/hila.ini b/users/hila.ini
new file mode 100644
index 0000000..a221eaf
--- /dev/null
+++ b/users/hila.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:49:45 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Print\ Only\ Text=false
diff --git a/users/hila1.ini b/users/hila1.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hila1.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/hila123.ini b/users/hila123.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hila123.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/hila2.ini b/users/hila2.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hila2.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/hila3.ini b/users/hila3.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hila3.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/hila4.ini b/users/hila4.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hila4.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/hila5.ini b/users/hila5.ini
new file mode 100644
index 0000000..dc5fc62
--- /dev/null
+++ b/users/hila5.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Tue Aug 16 14:21:37 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Images=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Link\ Lists=true
+Print\ Only\ Text=false
diff --git a/users/hilabecker.ini b/users/hilabecker.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/hilabecker.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/null.ini b/users/null.ini
new file mode 100644
index 0000000..091f523
--- /dev/null
+++ b/users/null.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Aug 11 14:32:53 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=false
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=false
+Display\ Image\ Link\ ALTs=false
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=false
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=false
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=false
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=false
+Ignore\ Flash=false
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=false
+Ignore\ Forms=false
+Display\ Image\ ALTs=false
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Minimum\ text\ length\ as\ substance=1
+Remove\ Empty\ Tables=false
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=false
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=false
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=false
+Ignore\ Link\ Lists=false
+Print\ Only\ Text=false
diff --git a/users/sb.ini b/users/sb.ini
new file mode 100644
index 0000000..c7997f4
--- /dev/null
+++ b/users/sb.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:58:56 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=false
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=false
+Link/Text\ Removal\ Ratio=0.75
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/shlomo.ini b/users/shlomo.ini
new file mode 100644
index 0000000..6a75078
--- /dev/null
+++ b/users/shlomo.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Fri Aug 12 14:35:20 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Images=false
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Link\ Lists=false
+Print\ Only\ Text=false
diff --git a/users/suhit.ini b/users/suhit.ini
new file mode 100644
index 0000000..a221eaf
--- /dev/null
+++ b/users/suhit.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:49:45 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Print\ Only\ Text=false
diff --git a/users/test.ini b/users/test.ini
new file mode 100644
index 0000000..a221eaf
--- /dev/null
+++ b/users/test.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:49:45 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Print\ Only\ Text=false
diff --git a/users/test1.ini b/users/test1.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/test1.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/test12.ini b/users/test12.ini
new file mode 100644
index 0000000..77b30f1
--- /dev/null
+++ b/users/test12.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Tue Aug 16 12:13:01 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=false
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=false
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=false
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=false
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=false
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Images=false
+Link/Text\ Removal\ Ratio=0.0
+Ignore\ Link\ Lists=true
+Print\ Only\ Text=false
diff --git a/users/test2.ini b/users/test2.ini
new file mode 100644
index 0000000..a221eaf
--- /dev/null
+++ b/users/test2.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:49:45 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Images=true
+Print\ Only\ Text=false
diff --git a/users/test3.ini b/users/test3.ini
new file mode 100644
index 0000000..57ffc11
--- /dev/null
+++ b/users/test3.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Aug 18 12:44:43 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=true
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Images=true
+Link/Text\ Removal\ Ratio=0.75
+Ignore\ Link\ Lists=true
+Print\ Only\ Text=false
diff --git a/users/test4.ini b/users/test4.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/test4.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/test83.ini b/users/test83.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/test83.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/test88.ini b/users/test88.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/test88.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/tester.ini b/users/tester.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/tester.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/testing123.ini b/users/testing123.ini
new file mode 100644
index 0000000..c426834
--- /dev/null
+++ b/users/testing123.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Feb 10 18:55:25 EST 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=false
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=false
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=false
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=false
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=false
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=false
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=false
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Link\ Lists=true
+Link/Text\ Removal\ Ratio=0.5
+Ignore\ Images=false
+Print\ Only\ Text=false
diff --git a/users/yael.ini b/users/yael.ini
new file mode 100644
index 0000000..ec925ba
--- /dev/null
+++ b/users/yael.ini
@@ -0,0 +1,42 @@
+#Content Extractor Settings File
+#Thu Aug 18 12:31:18 EDT 2005
+<A>\ tags\ are\ substance=true
+<FORM>\ tags\ are\ substance=true
+Ignore\ Image\ Links=false
+Ignore\ Meta\ Tags=true
+Display\ Image\ Link\ ALTs=true
+Ignore\ Text\ Links=true
+<INPUT>\ tags\ are\ substance=true
+Ignore\ <IFRAME>\ Tags=true
+<BUTTON>\ tags\ are\ substance=true
+Ignore\ All\ Advertisements=true
+<SELECT>\ tags\ are\ substance=true
+Ignore\ External\ Stylesheets=true
+<IFRAME>\ tags\ are\ substance=true
+Ignore\ <EMBED>\ tags=true
+Ignore\ Styles=true
+Ignore\ Only\ Links\ and\ Text\ in\ Link\ Lists=true
+Ignore\ <INPUT>\ Tags=true
+Ignore\ Flash=true
+Ignore\ Image\ Links\ in\ Link\ Lists=true
+<IMG>\ tags\ are\ substance=true
+<TEXTAREA>\ tags\ are\ substance=true
+Ignore\ Scripts=true
+Ignore\ Forms=true
+Display\ Image\ ALTs=true
+Maximum\ Number\ of\ Line\ Breaks=2
+Ignore\ <BUTTON>\ Tags=true
+Limit\ Number\ of\ Line\ Breaks=false
+Ignore\ Style\ Attribute\ in\ <DIV>\ Tags=true
+Ignore\ <NOSCRIPT>\ Tags=true
+Add\ removed\ links\ to\ bottom\ of\ the\ page=false
+Minimum\ text\ length\ as\ substance=12
+Remove\ Empty\ Tables=true
+Ignore\ Text\ Links\ in\ Link\ Lists=true
+Ignore\ Table\ Cell\ Widths=true
+Ignore\ Style\ Attributes=true
+Ignore\ <SELECT>\ Tags=true
+Ignore\ Images=false
+Link/Text\ Removal\ Ratio=0.25
+Ignore\ Link\ Lists=true
+Print\ Only\ Text=false