Indhumathi27 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r542272811 ########## File path: index/secondary-index/src/test/scala/org/apache/carbondata/spark/testsuite/mergedata/CarbonDataFileMergeTestCaseOnSI.scala ########## @@ -287,6 +294,65 @@ class CarbonDataFileMergeTestCaseOnSI CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE_DEFAULT) } + test("test verify data file merge when exception occurred in rebuild segment") { + CarbonProperties.getInstance() + .addProperty(CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE, "false") + sql("DROP TABLE IF EXISTS nonindexmerge") + sql( + """ + | CREATE TABLE nonindexmerge(id INT, name STRING, city STRING, age INT) + | STORED AS carbondata + | TBLPROPERTIES('SORT_COLUMNS'='city,name', 'SORT_SCOPE'='GLOBAL_SORT') + """.stripMargin) + sql(s"LOAD DATA LOCAL INPATH '$file2' INTO TABLE nonindexmerge OPTIONS('header'='false', " + + s"'GLOBAL_SORT_PARTITIONS'='100')") + sql(s"LOAD DATA LOCAL INPATH '$file2' INTO TABLE nonindexmerge OPTIONS('header'='false', " + + s"'GLOBAL_SORT_PARTITIONS'='100')") + sql("CREATE INDEX nonindexmerge_index1 on table nonindexmerge (name) AS 'carbondata'") + // when merge data file will throw the exception + val mock1 = mockDataFileMerge() + val ex = intercept[RuntimeException] { + sql("REFRESH INDEX nonindexmerge_index1 ON TABLE nonindexmerge").collect() + } + mock1.tearDown() + assert(ex.getMessage.contains("An exception occurred while merging data files in SI")) + var df1 = sql("""Select * from nonindexmerge where name='n16000'""") + .queryExecution.sparkPlan + assert(isFilterPushedDownToSI(df1)) + assert(getDataFileCount("nonindexmerge_index1", "0") == 100) + assert(getDataFileCount("nonindexmerge_index1", "1") == 100) + // not able to acquire lock on table + val mock2 = TestSecondaryIndexUtils.mockTableLock() + val exception = intercept[AnalysisException] { + sql("REFRESH INDEX nonindexmerge_index1 ON TABLE nonindexmerge").collect() + } + 
mock2.tearDown() + assert(exception.getMessage.contains("Table is already locked for compaction. " + + "Please try after some time.")) + df1 = sql("""Select * from nonindexmerge where name='n16000'""") + .queryExecution.sparkPlan + assert(getDataFileCount("nonindexmerge_index1", "0") == 100) + assert(getDataFileCount("nonindexmerge_index1", "1") == 100) + CarbonProperties.getInstance().addProperty(CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE, + CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE_DEFAULT) + } + + def mockDataFileMerge(): MockUp[SecondaryIndexUtil.type] = { Review comment: Move all mock test methods to TestSecondaryIndexUtils. ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-744343158 Build Failed with Spark 2.4.5, Please check CI http://121.244.95.60:12444/job/ApacheCarbon_PR_Builder_2.4.5/3394/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-744401392 Build Success with Spark 2.3.4, Please check CI http://121.244.95.60:12444/job/ApacheCarbonPRBuilder2.3/5157/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745113304 Build Success with Spark 2.4.5, Please check CI http://121.244.95.60:12444/job/ApacheCarbon_PR_Builder_2.4.5/3401/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745113746 Build Success with Spark 2.3.4, Please check CI http://121.244.95.60:12444/job/ApacheCarbonPRBuilder2.3/5163/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r543354336 ########## File path: index/secondary-index/src/test/scala/org/apache/carbondata/spark/testsuite/secondaryindex/TestSIWithRangeColumn.scala ########## @@ -0,0 +1,84 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.carbondata.spark.testsuite.secondaryindex + +import org.apache.spark.sql.Row +import org.apache.spark.sql.test.util.QueryTest + +class TestSIWithRangeColumn extends QueryTest { + test("test SI on range column with and without global sort") { + sql("drop table if exists carbon_range_column") + sql( + """ + | CREATE TABLE carbon_range_column(id INT, name STRING, city STRING, age INT) + | STORED AS carbondata + | TBLPROPERTIES( + | 'SORT_SCOPE'='LOCAL_SORT', 'SORT_COLUMNS'='name, city', 'range_column'='city') + """.stripMargin) + sql("CREATE INDEX range_si on carbon_range_column(city) as 'carbondata'") + sql("INSERT into carbon_range_column values(1,'nko','blr',25)") + checkAnswer(sql("SELECT count(*) FROM range_si"), Seq(Row(1))) + checkAnswer(sql("SELECT name FROM carbon_range_column where city='blr'"), Seq(Row("nko"))) + sql("drop index if exists range_si on carbon_range_column") + sql("CREATE INDEX range_si on carbon_range_column(city) as 'carbondata'" + + " PROPERTIES('sort_scope'='global_sort', 'Global_sort_partitions'='1')") + checkAnswer(sql("SELECT count(*) FROM range_si"), Seq(Row(1))) + sql("drop table if exists carbon_range_column") + } + + test("test SI creation with range column") { + sql("drop table if exists carbon_range_column") + sql( Review comment: done ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r543354451 ########## File path: integration/spark/src/main/scala/org/apache/spark/sql/execution/command/management/CarbonAlterTableCompactionCommand.scala ########## @@ -102,6 +102,10 @@ case class CarbonAlterTableCompactionCommand( throw new MalformedCarbonCommandException( "Unsupported alter operation on carbon table") } + if (table.isIndexTable) { + throw new MalformedCarbonCommandException( + "Unsupported alter operation on carbon table: Compaction not supported on SI table") Review comment: done ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r543354611 ########## File path: integration/spark/src/main/scala/org/apache/spark/sql/execution/command/table/CarbonCreateTableLikeCommand.scala ########## @@ -48,8 +48,9 @@ case class CarbonCreateTableLikeCommand( if (!srcTable.isTransactionalTable) { throw new MalformedCarbonCommandException("Unsupported operation on non transactional table") } - if (srcTable.isMV) { - throw new MalformedCarbonCommandException("Unsupported operation on child table or MV") + if (srcTable.isMV || srcTable.isIndexTable) { + throw new MalformedCarbonCommandException("Unsupported operation on child " + Review comment: done ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r543354758 ########## File path: integration/spark/src/test/scala/org/apache/carbondata/spark/testsuite/datacompaction/CarbonIndexFileMergeTestCase.scala ########## @@ -111,6 +111,32 @@ class CarbonIndexFileMergeTestCase checkAnswer(sql("""Select count(*) from nonindexmerge"""), rows) } + test("verify index file merge for SI") { Review comment: removed ########## File path: index/secondary-index/src/test/scala/org/apache/carbondata/spark/testsuite/mergedata/CarbonDataFileMergeTestCaseOnSI.scala ########## @@ -287,6 +294,65 @@ class CarbonDataFileMergeTestCaseOnSI CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE_DEFAULT) } + test("test verify data file merge when exception occurred in rebuild segment") { + CarbonProperties.getInstance() + .addProperty(CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE, "false") + sql("DROP TABLE IF EXISTS nonindexmerge") + sql( + """ + | CREATE TABLE nonindexmerge(id INT, name STRING, city STRING, age INT) + | STORED AS carbondata + | TBLPROPERTIES('SORT_COLUMNS'='city,name', 'SORT_SCOPE'='GLOBAL_SORT') + """.stripMargin) + sql(s"LOAD DATA LOCAL INPATH '$file2' INTO TABLE nonindexmerge OPTIONS('header'='false', " + + s"'GLOBAL_SORT_PARTITIONS'='100')") + sql(s"LOAD DATA LOCAL INPATH '$file2' INTO TABLE nonindexmerge OPTIONS('header'='false', " + + s"'GLOBAL_SORT_PARTITIONS'='100')") + sql("CREATE INDEX nonindexmerge_index1 on table nonindexmerge (name) AS 'carbondata'") + // when merge data file will throw the exception + val mock1 = mockDataFileMerge() + val ex = intercept[RuntimeException] { + sql("REFRESH INDEX nonindexmerge_index1 ON TABLE nonindexmerge").collect() + } + mock1.tearDown() + assert(ex.getMessage.contains("An exception occurred while merging data files in SI")) + var df1 = sql("""Select * from nonindexmerge where name='n16000'""") + .queryExecution.sparkPlan + assert(isFilterPushedDownToSI(df1)) + 
assert(getDataFileCount("nonindexmerge_index1", "0") == 100) + assert(getDataFileCount("nonindexmerge_index1", "1") == 100) + // not able to acquire lock on table + val mock2 = TestSecondaryIndexUtils.mockTableLock() + val exception = intercept[AnalysisException] { + sql("REFRESH INDEX nonindexmerge_index1 ON TABLE nonindexmerge").collect() + } + mock2.tearDown() + assert(exception.getMessage.contains("Table is already locked for compaction. " + + "Please try after some time.")) + df1 = sql("""Select * from nonindexmerge where name='n16000'""") + .queryExecution.sparkPlan + assert(getDataFileCount("nonindexmerge_index1", "0") == 100) + assert(getDataFileCount("nonindexmerge_index1", "1") == 100) + CarbonProperties.getInstance().addProperty(CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE, + CarbonCommonConstants.CARBON_SI_SEGMENT_MERGE_DEFAULT) + } + + def mockDataFileMerge(): MockUp[SecondaryIndexUtil.type] = { Review comment: done ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745364382 Build Success with Spark 2.4.5, Please check CI http://121.244.95.60:12444/job/ApacheCarbon_PR_Builder_2.4.5/3408/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745364961 Build Success with Spark 2.3.4, Please check CI http://121.244.95.60:12444/job/ApacheCarbonPRBuilder2.3/5170/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
Indhumathi27 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745813841 @nihal0107 please rebase ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-745894195 > @nihal0107 please rebase rebased ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-746010497 Build Success with Spark 2.3.4, Please check CI http://121.244.95.60:12444/job/ApacheCarbonPRBuilder2.3/5178/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-746016701 Build Success with Spark 2.4.5, Please check CI http://121.244.95.60:12444/job/ApacheCarbon_PR_Builder_2.4.5/3416/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
Indhumathi27 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r545182218 ########## File path: integration/spark/src/main/scala/org/apache/spark/sql/secondaryindex/util/SecondaryIndexUtil.scala ########## @@ -542,100 +542,6 @@ object SecondaryIndexUtil { indexToFactColMapping } - /** - * Identifies all segments which can be merged for compaction type - CUSTOM. - * - * @param sparkSession - * @param tableName - * @param dbName - * @param customSegments - * @return list of LoadMetadataDetails - * @throws UnsupportedOperationException if customSegments is null or empty - */ - def identifySegmentsToBeMergedCustom(sparkSession: SparkSession, Review comment: Please revert the changes to this file. These are APIs exposed to users for test purposes. ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-748003676 Build Failed with Spark 2.4.5, Please check CI http://121.244.95.60:12545/job/ApacheCarbon_PR_Builder_2.4.5/3299/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
nihal0107 commented on a change in pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#discussion_r547896201 ########## File path: integration/spark/src/main/scala/org/apache/spark/sql/secondaryindex/util/SecondaryIndexUtil.scala ########## @@ -542,100 +542,6 @@ object SecondaryIndexUtil { indexToFactColMapping } - /** - * Identifies all segments which can be merged for compaction type - CUSTOM. - * - * @param sparkSession - * @param tableName - * @param dbName - * @param customSegments - * @return list of LoadMetadataDetails - * @throws UnsupportedOperationException if customSegments is null or empty - */ - def identifySegmentsToBeMergedCustom(sparkSession: SparkSession, Review comment: done ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-750253944 Build Success with Spark 2.4.5, Please check CI http://121.244.95.60:12444/job/ApacheCarbon_PR_Builder_2.4.5/3480/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
In reply to this post by GitBox
CarbonDataQA2 commented on pull request #4037: URL: https://github.com/apache/carbondata/pull/4037#issuecomment-750255128 Build Success with Spark 2.3.4, Please check CI http://121.244.95.60:12444/job/ApacheCarbonPRBuilder2.3/5241/ ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: [hidden email] |
Free forum by Nabble | Edit this page |