On a brand-new Brisk installation on an Ubuntu server, I get the following error when I try to run a job:
Exception in thread "main" java.io.IOException: No FileSystem for scheme: cfs
at org.apache.hadoop.fs.FileSystem.createFileSystem(FileSystem.java:1307)
at org.apache.hadoop.fs.FileSystem.access$100(FileSystem.java:65)
...
I read on the forums that this can be caused by Brisk's core-site.xml not being on the classpath, but I checked and it is there. Here's the classpath being used to launch Brisk via jsvc:
/usr/share/brisk/brisk.jar
/usr/share/brisk/common/log4j-1.2.16.jar
/usr/share/brisk/common/slf4j-api-1.6.1.jar
/usr/share/brisk/common/slf4j-log4j12-1.6.1.jar
/etc/brisk/cassandra
/usr/share/brisk/cassandra/lib/antlr-2.7.7.jar
/usr/share/brisk/cassandra/lib/antlr-3.1.3.jar
/usr/share/brisk/cassandra/lib/antlr-runtime-3.1.3.jar
/usr/share/brisk/cassandra/lib/apache-cassandra-0.8.1-brisk1-beta2.jar
/usr/share/brisk/cassandra/lib/apache-cassandra-cql-1.0.1-20110620.040412-84.jar
/usr/share/brisk/cassandra/lib/apache-cassandra-thrift-0.8.1-brisk1-beta2.jar
/usr/share/brisk/cassandra/lib/avro-1.4.0-cassandra-1.jar
/usr/share/brisk/cassandra/lib/commons-cli-1.1.jar
/usr/share/brisk/cassandra/lib/commons-codec-1.2.jar
/usr/share/brisk/cassandra/lib/commons-collections-3.2.1.jar
/usr/share/brisk/cassandra/lib/commons-lang-2.4.jar
/usr/share/brisk/cassandra/lib/concurrentlinkedhashmap-lru-1.1.jar
/usr/share/brisk/cassandra/lib/guava-r08.jar
/usr/share/brisk/cassandra/lib/high-scale-lib-1.1.1.jar
/usr/share/brisk/cassandra/lib/jackson-core-asl-1.4.0.jar
/usr/share/brisk/cassandra/lib/jackson-mapper-asl-1.4.0.jar
/usr/share/brisk/cassandra/lib/jamm-0.2.1.jar
/usr/share/brisk/cassandra/lib/jetty-6.1.21.jar
/usr/share/brisk/cassandra/lib/jetty-util-6.1.21.jar
/usr/share/brisk/cassandra/lib/jline-0.9.94.jar
/usr/share/brisk/cassandra/lib/joda-time-1.6.2.jar
/usr/share/brisk/cassandra/lib/json-simple-1.1.jar
/usr/share/brisk/cassandra/lib/jug-2.0.0-asl.jar
/usr/share/brisk/cassandra/lib/libthrift-0.6.0.jar
/usr/share/brisk/cassandra/lib/servlet-api-2.5-20081211.jar
/usr/share/brisk/cassandra/lib/slf4j-api-1.6.1.jar
/usr/share/brisk/cassandra/lib/snakeyaml-1.6.jar
/usr/share/brisk/cassandra/lib/snappy-java-1.0.3-20110604.005740-2.jar
/usr/share/brisk/cassandra/lib/stringtemplate-3.2.jar
/usr/share/brisk/brisk.jar
/usr/share/brisk/hive/lib/hive-cassandra-handler-0.7.0-brisk1-beta2.jar
/usr/share/brisk/hadoop
/usr/share/brisk/hadoop
/etc/brisk/hadoop
/usr/share/brisk/hadoop/*.jar
/usr/share/brisk/hadoop/lib/ant-1.6.5.jar
/usr/share/brisk/hadoop/lib/commons-beanutils-1.7.0.jar
/usr/share/brisk/hadoop/lib/commons-beanutils-core-1.8.0.jar
/usr/share/brisk/hadoop/lib/commons-cli-1.2.jar
/usr/share/brisk/hadoop/lib/commons-codec-1.4.jar
/usr/share/brisk/hadoop/lib/commons-collections-3.2.1.jar
/usr/share/brisk/hadoop/lib/commons-configuration-1.6.jar
/usr/share/brisk/hadoop/lib/commons-digester-1.8.jar
/usr/share/brisk/hadoop/lib/commons-el-1.0.jar
/usr/share/brisk/hadoop/lib/commons-httpclient-3.0.1.jar
/usr/share/brisk/hadoop/lib/commons-lang-2.4.jar
/usr/share/brisk/hadoop/lib/commons-logging-1.0.4.jar
/usr/share/brisk/hadoop/lib/commons-math-2.1.jar
/usr/share/brisk/hadoop/lib/commons-net-1.4.1.jar
/usr/share/brisk/hadoop/lib/core-3.1.1.jar
/usr/share/brisk/hadoop/lib/ftplet-api-1.0.0.jar
/usr/share/brisk/hadoop/lib/ftpserver-core-1.0.0.jar
/usr/share/brisk/hadoop/lib/ftpserver-deprecated-1.0.0-M2.jar
/usr/share/brisk/hadoop/lib/hadoop-core-0.20.203.1-brisk1-beta2.jar
/usr/share/brisk/hadoop/lib/hadoop-examples-0.20.203.1-brisk1-beta2.jar
/usr/share/brisk/hadoop/lib/hadoop-fairscheduler-0.20.203.1-brisk1.jar
/usr/share/brisk/hadoop/lib/hadoop-streaming-0.20.203.1-brisk1-beta2.jar
/usr/share/brisk/hadoop/lib/hadoop-test-0.20.203.1-brisk1-beta2.jar
/usr/share/brisk/hadoop/lib/hadoop-tools-0.20.203.1-brisk1-beta2.jar
/usr/share/brisk/hadoop/lib/hsqldb-1.8.0.10.jar
/usr/share/brisk/hadoop/lib/jasper-compiler-5.5.12.jar
/usr/share/brisk/hadoop/lib/jasper-runtime-5.5.12.jar
/usr/share/brisk/hadoop/lib/jets3t-0.7.1.jar
/usr/share/brisk/hadoop/lib/jetty-6.1.26.jar
/usr/share/brisk/hadoop/lib/jetty-util-6.1.26.jar
/usr/share/brisk/hadoop/lib/jsp-2.1-6.1.14.jar
/usr/share/brisk/hadoop/lib/jsp-api-2.1-6.1.14.jar
/usr/share/brisk/hadoop/lib/junit-3.8.1.jar
/usr/share/brisk/hadoop/lib/kfs-0.3.jar
/usr/share/brisk/hadoop/lib/mina-core-2.0.0-M5.jar
/usr/share/brisk/hadoop/lib/oro-2.0.8.jar
/usr/share/brisk/hadoop/lib/servlet-api-2.5-20081211.jar
/usr/share/brisk/hadoop/lib/servlet-api-2.5-6.1.14.jar
/usr/share/brisk/hadoop/lib/xmlenc-0.52.jar
/usr/share/java/jna.jar
/usr/share/java/commons-daemon.jar
For reference, here is the code used to create the job:
// Create the job and point it at the class whose jar should be shipped.
Job job = new Job();
job.setJarByClass(ComputeAttentionBasedScores.class);

// Map stage and the key/value types it emits.
job.setMapperClass(MapOutgoing.class);
job.setMapOutputKeyClass(Text.class);
job.setMapOutputValueClass(MappedValue.class);

// Reduce stage and the key/value types of the final output.
job.setReducerClass(CombineOutgoing.class);
job.setOutputKeyClass(ByteBuffer.class);
job.setOutputValueClass(List.class);

// Input side: rows are read from Cassandra through ColumnFamilyInputFormat.
job.setInputFormatClass(ColumnFamilyInputFormat.class);
ConfigHelper.setRpcPort(job.getConfiguration(), String.valueOf(Constants.port));
ConfigHelper.setInitialAddress(job.getConfiguration(), Constants.hostName);

// The keyspace login is published twice under the same property names:
// once as plain configuration values and once as secret keys in the job credentials.
String usernameProperty = "cassandra.input.keyspace.username";
String passwordProperty = "cassandra.input.keyspace.passwd";
job.getConfiguration().set(usernameProperty, Constants.user);
job.getConfiguration().set(passwordProperty, Constants.pwd);
job.getCredentials().addSecretKey(new Text(usernameProperty), ByteBufferUtil.bytes(Constants.user).array());
job.getCredentials().addSecretKey(new Text(passwordProperty), ByteBufferUtil.bytes(Constants.pwd).array());

ConfigHelper.setPartitioner(job.getConfiguration(), "org.apache.cassandra.dht.RandomPartitioner");
ConfigHelper.setInputColumnFamily(job.getConfiguration(), Constants.keySpace, Constants.MessageByCultCF);

// Slice with empty start and finish names, not reversed, limited to 100 columns.
ByteBuffer sliceStart = ByteBufferUtil.bytes("");
ByteBuffer sliceFinish = ByteBufferUtil.bytes("");
SliceRange columnRange = new SliceRange(sliceStart, sliceFinish, false, 100); //TODO: here we return max. 100 columns.
SlicePredicate inputPredicate = new SlicePredicate().setSlice_range(columnRange);
ConfigHelper.setInputSlicePredicate(job.getConfiguration(), inputPredicate);

// Output side: results are written back to Cassandra through ColumnFamilyOutputFormat.
job.setOutputFormatClass(ColumnFamilyOutputFormat.class);
ConfigHelper.setOutputColumnFamily(job.getConfiguration(), Constants.keySpace, Constants.outgoingCF);

// Submit and block until the job finishes, with verbose progress reporting enabled.
job.waitForCompletion(true);
