<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="bbPress/1.0.3" -->
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom">
	<channel>
		<title>DataStax Support Forums &#187; Topic: Hive exploding on a count(*) but works with a select *</title>
		<link>http://www.datastax.com/support-forums/topic/hive-exploding-on-a-count-but-works-with-a-select</link>
		<description>Software, Support, and Training for Apache Cassandra</description>
		<language>en-US</language>
		<pubDate>Sat, 25 May 2013 17:05:37 +0000</pubDate>
		<generator>http://bbpress.org/?v=1.0.3</generator>
		<textInput>
			<title><![CDATA[Search]]></title>
			<description><![CDATA[Search all topics from these forums.]]></description>
			<name>q</name>
			<link>http://www.datastax.com/support-forums/search.php</link>
		</textInput>
		<atom:link href="http://www.datastax.com/support-forums/rss/topic/hive-exploding-on-a-count-but-works-with-a-select" rel="self" type="application/rss+xml" />

		<item>
			<title>Anonymous on "Hive exploding on a count(*) but works with a select *"</title>
			<link>http://www.datastax.com/support-forums/topic/hive-exploding-on-a-count-but-works-with-a-select#post-573</link>
			<pubDate>Fri, 21 Oct 2011 11:18:13 +0000</pubDate>
			<dc:creator>Anonymous</dc:creator>
			<guid isPermaLink="false">573@http://www.datastax.com/support-forums/</guid>
			<description>&#60;p&#62;I have been trying to do a query and it is exploding in a fantastic fashion.  Below is my test case&#60;/p&#62;
&#60;p&#62;Hive history file=/tmp/vachon/hive_job_log_vachon_201110211052_1405555749.txt&#60;br /&#62;
hive&#38;gt; CREATE EXTERNAL TABLE TESTTABLE&#60;br /&#62;
    &#38;gt; (row_key string, column_name string, value string)&#60;br /&#62;
    &#38;gt; STORED BY 'org.apache.hadoop.hive.cassandra.CassandraStorageHandler'&#60;br /&#62;
    &#38;gt; WITH SERDEPROPERTIES (&#34;cassandra.ks.name&#34; = &#34;Greyhound&#34;);&#60;br /&#62;
OK&#60;br /&#62;
Time taken: 1.458 seconds&#60;/p&#62;
&#60;p&#62;&#38;gt;&#38;gt; OK so Hive works and has write access, it seems&#60;/p&#62;
&#60;p&#62;hive&#38;gt; SELECT * FROM greyhound.PlayerEvents limit 10;&#60;br /&#62;
OK&#60;br /&#62;
[10 Records worth of output]&#60;br /&#62;
Time taken: 2.365 seconds&#60;/p&#62;
&#60;p&#62;&#38;gt;&#38;gt; OK so Hive can read as well&#60;/p&#62;
&#60;p&#62;So now that I know I can read and write, I want to do: &#60;/p&#62;
&#60;p&#62;SELECT count(*) FROM greyhound.PlayerEvents;&#60;/p&#62;
&#60;p&#62;I get this output in syslog&#60;/p&#62;
&#60;p&#62;n/jobcache/job_201110210214_0001/jars/, file:/tmp/hadoop-cassandra/mapred/local/taskTracker/vachon/jobcache/job_201110210214_0001/attempt_201110210214_0001_m_000000_0/work/]&#60;br /&#62;
2011-10-21 02:15:29,463 INFO org.apache.hadoop.hive.ql.exec.MapOperator: Adding alias greyhound.playerevents to work list for file cfs://null/user/hive/warehouse/greyhound.db/playerevents&#60;br /&#62;
2011-10-21 02:15:29,465 INFO org.apache.hadoop.hive.ql.exec.MapOperator: dump TS struct&#38;lt;player_id:string,application_event_id:string,id:string,event_data:string&#38;gt;&#60;br /&#62;
2011-10-21 02:15:29,466 INFO ExecMapper:&#60;br /&#62;
&#38;lt;MAP&#38;gt;Id =7&#60;br /&#62;
  &#38;lt;Children&#38;gt;&#60;br /&#62;
    &#38;lt;TS&#38;gt;Id =0&#60;br /&#62;
      &#38;lt;Children&#38;gt;&#60;br /&#62;
        &#38;lt;SEL&#38;gt;Id =1&#60;br /&#62;
          &#38;lt;Children&#38;gt;&#60;br /&#62;
            &#38;lt;GBY&#38;gt;Id =2&#60;br /&#62;
              &#38;lt;Children&#38;gt;&#60;br /&#62;
                &#38;lt;RS&#38;gt;Id =3&#60;br /&#62;
                  &#38;lt;Parent&#38;gt;Id = 2 null&#38;lt;\Parent&#38;gt;&#60;br /&#62;
                &#38;lt;\RS&#38;gt;&#60;br /&#62;
              &#38;lt;\Children&#38;gt;&#60;br /&#62;
              &#38;lt;Parent&#38;gt;Id = 1 null&#38;lt;\Parent&#38;gt;&#60;br /&#62;
            &#38;lt;\GBY&#38;gt;&#60;br /&#62;
          &#38;lt;\Children&#38;gt;&#60;br /&#62;
          &#38;lt;Parent&#38;gt;Id = 0 null&#38;lt;\Parent&#38;gt;&#60;br /&#62;
        &#38;lt;\SEL&#38;gt;&#60;br /&#62;
      &#38;lt;\Children&#38;gt;&#60;br /&#62;
      &#38;lt;Parent&#38;gt;Id = 7 null&#38;lt;\Parent&#38;gt;&#60;br /&#62;
    &#38;lt;\TS&#38;gt;&#60;br /&#62;
  &#38;lt;\Children&#38;gt;&#60;br /&#62;
&#38;lt;\MAP&#38;gt;&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.MapOperator: Initializing Self 7 MAP&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: Initializing Self 0 TS&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: Operator 0 TS initialized&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: Initializing children of 0 TS&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: Initializing child 1 SEL&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: Initializing Self 1 SEL&#60;br /&#62;
2011-10-21 02:15:29,466 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: SELECT struct&#38;lt;player_id:string,application_event_id:string,id:string,event_data:string&#38;gt;&#60;br /&#62;
2011-10-21 02:15:29,469 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: Operator 1 SEL initialized&#60;br /&#62;
2011-10-21 02:15:29,469 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: Initializing children of 1 SEL&#60;br /&#62;
2011-10-21 02:15:29,469 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: Initializing child 2 GBY&#60;br /&#62;
2011-10-21 02:15:29,469 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: Initializing Self 2 GBY&#60;br /&#62;
2011-10-21 02:15:29,484 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: Operator 2 GBY initialized&#60;br /&#62;
2011-10-21 02:15:29,484 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: Initializing children of 2 GBY&#60;br /&#62;
2011-10-21 02:15:29,484 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: Initializing child 3 RS&#60;br /&#62;
2011-10-21 02:15:29,484 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: Initializing Self 3 RS&#60;br /&#62;
2011-10-21 02:15:29,488 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: Using tag = -1&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: Operator 3 RS initialized&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: Initialization Done 3 RS&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: Initialization Done 2 GBY&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: Initialization Done 1 SEL&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: Initialization Done 0 TS&#60;br /&#62;
2011-10-21 02:15:29,499 INFO org.apache.hadoop.hive.ql.exec.MapOperator: Initialization Done 7 MAP&#60;br /&#62;
2011-10-21 02:15:29,532 INFO org.apache.hadoop.hive.ql.exec.MapOperator: Processing path cfs://null/user/hive/warehouse/greyhound.db/playerevents&#60;br /&#62;
2011-10-21 02:15:29,532 INFO org.apache.hadoop.hive.ql.exec.MapOperator: Processing alias greyhound.playerevents for file cfs://null/user/hive/warehouse/greyhound.db/playerevents&#60;br /&#62;
2011-10-21 02:15:29,532 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 forwarding 1 rows&#60;br /&#62;
2011-10-21 02:15:29,533 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 forwarding 1 rows&#60;br /&#62;
2011-10-21 02:15:29,533 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 forwarding 1 rows&#60;br /&#62;
2011-10-21 02:15:29,533 INFO ExecMapper: ExecMapper: processing 1 rows: used memory = 129923416&#60;br /&#62;
2011-10-21 02:15:29,536 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 forwarding 10 rows&#60;br /&#62;
2011-10-21 02:15:29,536 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 forwarding 10 rows&#60;br /&#62;
2011-10-21 02:15:29,536 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 forwarding 10 rows&#60;br /&#62;
2011-10-21 02:15:29,536 INFO ExecMapper: ExecMapper: processing 10 rows: used memory = 129923416&#60;br /&#62;
2011-10-21 02:15:29,559 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 forwarding 100 rows&#60;br /&#62;
2011-10-21 02:15:29,559 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 forwarding 100 rows&#60;br /&#62;
2011-10-21 02:15:29,559 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 forwarding 100 rows&#60;br /&#62;
2011-10-21 02:15:29,559 INFO ExecMapper: ExecMapper: processing 100 rows: used memory = 130469504&#60;br /&#62;
2011-10-21 02:15:29,691 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 finished. closing...&#60;br /&#62;
2011-10-21 02:15:29,691 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 forwarded 415 rows&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.MapOperator: DESERIALIZE_ERRORS:0&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 finished. closing...&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 forwarded 415 rows&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 finished. closing...&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 forwarded 415 rows&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: 2 finished. closing...&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: 2 forwarded 0 rows&#60;br /&#62;
2011-10-21 02:15:29,692 WARN org.apache.hadoop.hive.ql.exec.GroupByOperator: Begin Hash Table flush at close: size = 1&#60;br /&#62;
2011-10-21 02:15:29,692 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: 2 forwarding 1 rows&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: 3 finished. closing...&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.ReduceSinkOperator: 3 forwarded 0 rows&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.GroupByOperator: 2 Close done&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.SelectOperator: 1 Close done&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.TableScanOperator: 0 Close done&#60;br /&#62;
2011-10-21 02:15:29,693 INFO org.apache.hadoop.hive.ql.exec.MapOperator: 7 Close done&#60;br /&#62;
2011-10-21 02:15:29,694 INFO ExecMapper: ExecMapper: processed 415 rows: used memory = 108402288&#60;br /&#62;
2011-10-21 02:15:29,700 INFO org.apache.hadoop.mapred.TaskLogsTruncater: Initializing logs' truncater with mapRetainSize=-1 and reduceRetainSize=-1&#60;br /&#62;
2011-10-21 02:15:29,715 WARN org.apache.hadoop.mapred.Child: Error running child&#60;br /&#62;
java.lang.NullPointerException&#60;br /&#62;
	at org.apache.hadoop.hive.cassandra.input.HiveCassandraStandardColumnInputFormat$2.next(HiveCassandraStandardColumnInputFormat.java:173)&#60;br /&#62;
	at org.apache.hadoop.hive.cassandra.input.HiveCassandraStandardColumnInputFormat$2.next(HiveCassandraStandardColumnInputFormat.java:111)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveRecordReader.doNext(HiveRecordReader.java:66)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveRecordReader.doNext(HiveRecordReader.java:32)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveContextAwareRecordReader.next(HiveContextAwareRecordReader.java:67)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.moveToNext(MapTask.java:236)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.next(MapTask.java:216)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:48)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:435)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask.run(MapTask.java:371)&#60;br /&#62;
	at org.apache.hadoop.mapred.Child$4.run(Child.java:259)&#60;br /&#62;
	at java.security.AccessController.doPrivileged(Native Method)&#60;br /&#62;
	at javax.security.auth.Subject.doAs(Subject.java:396)&#60;br /&#62;
	at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1059)&#60;br /&#62;
	at org.apache.hadoop.mapred.Child.main(Child.java:253)&#60;br /&#62;
2011-10-21 02:15:29,721 INFO org.apache.hadoop.mapred.Task: Runnning cleanup for the task&#60;/p&#62;
&#60;p&#62;&#38;gt;&#38;gt; OK so that explodes.  I try it on another brisk cluster and I get:&#60;/p&#62;
&#60;p&#62;java.lang.UnsupportedOperationException: This operation is not supported for Super Columns.&#60;br /&#62;
	at org.apache.cassandra.db.SuperColumn.value(SuperColumn.java:174)&#60;br /&#62;
	at org.apache.hadoop.hive.cassandra.input.HiveCassandraStandardColumnInputFormat$2.next(HiveCassandraStandardColumnInputFormat.java:242)&#60;br /&#62;
	at org.apache.hadoop.hive.cassandra.input.HiveCassandraStandardColumnInputFormat$2.next(HiveCassandraStandardColumnInputFormat.java:111)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveRecordReader.doNext(HiveRecordReader.java:66)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveRecordReader.doNext(HiveRecordReader.java:32)&#60;br /&#62;
	at org.apache.hadoop.hive.ql.io.HiveContextAwareRecordReader.next(HiveContextAwareRecordReader.java:67)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.moveToNext(MapTask.java:236)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.next(MapTask.java:216)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:48)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:435)&#60;br /&#62;
	at org.apache.hadoop.mapred.MapTask.run(MapTask.java:371)&#60;br /&#62;
	at org.apache.hadoop.mapred.Child$4.run(Child.java:259)&#60;br /&#62;
	at java.security.AccessController.doPrivileged(Native Method)&#60;br /&#62;
	at javax.security.auth.Subject.doAs(Subject.java:416)&#60;br /&#62;
	at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1059)&#60;br /&#62;
	at org.apache.hadoop.mapred.Child.main(Child.java:253)&#60;/p&#62;
&#60;p&#62;java.lang.Throwable: Child Error&#60;br /&#62;
	at org.apache.hadoop.mapred.TaskRunner.run(TaskRunner.java:271)&#60;br /&#62;
Caused by: java.io.IOException: Task process exit with nonzero status of 65.&#60;br /&#62;
	at org.apache.hadoop.mapred.TaskRunner.run(TaskRunner.java:258)&#60;/p&#62;
&#60;p&#62;&#38;gt;&#38;gt; So my overall question is this: what in particular isn't supported, and why are the two error messages different?&#60;/p&#62;
&#60;p&#62;Also, I ran the select limit 10 query on our test environment and I got: &#34;Failed with exception java.io.IOException:java.lang.UnsupportedOperationException: This operation is not supported for Super Columns.&#34; again, but this works on our production cluster.
&#60;/p&#62;</description>
		</item>

	</channel>
</rss>
