提交 b0fbce71 编写于 作者: M mingliang 提交者: Robert Metzger

add test for delete process of tmp file and tested in cluster

上级 8676280d
...@@ -13,20 +13,23 @@ ...@@ -13,20 +13,23 @@
package eu.stratosphere.api.common; package eu.stratosphere.api.common;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Preconditions.checkNotNull;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Calendar; import java.util.Calendar;
import java.util.Collection; import java.util.Collection;
import java.util.Collections; import java.util.Collections;
import java.util.HashMap;
import java.util.List; import java.util.List;
import java.util.Map.Entry;
import java.util.Set;
import eu.stratosphere.api.common.operators.GenericDataSink; import eu.stratosphere.api.common.operators.GenericDataSink;
import eu.stratosphere.api.common.operators.Operator; import eu.stratosphere.api.common.operators.Operator;
import eu.stratosphere.util.Visitable; import eu.stratosphere.util.Visitable;
import eu.stratosphere.util.Visitor; import eu.stratosphere.util.Visitor;
import static com.google.common.base.Preconditions.checkNotNull;
import static com.google.common.base.Preconditions.checkArgument;
/** /**
* This class encapsulates a single stratosphere job (an instantiated data flow), together with some parameters. * This class encapsulates a single stratosphere job (an instantiated data flow), together with some parameters.
* Parameters include the name and a default degree of parallelism. The job is referenced by the data sinks, * Parameters include the name and a default degree of parallelism. The job is referenced by the data sinks,
......
/***********************************************************************************************************************
* Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
* an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
**********************************************************************************************************************/
package eu.stratosphere.api.common.cache; package eu.stratosphere.api.common.cache;
import eu.stratosphere.configuration.ConfigConstants;
import eu.stratosphere.configuration.Configuration; import eu.stratosphere.configuration.Configuration;
import eu.stratosphere.configuration.GlobalConfiguration;
import eu.stratosphere.core.fs.Path; import eu.stratosphere.core.fs.Path;
import java.util.HashMap; import java.util.HashMap;
import java.util.Map; import java.util.Map;
import java.util.Map.Entry; import java.util.Map.Entry;
import java.io.File; import java.io.File;
import java.util.Set; import java.util.Set;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.FutureTask; import java.util.concurrent.FutureTask;
/** /**
...@@ -29,8 +38,6 @@ public class DistributedCache { ...@@ -29,8 +38,6 @@ public class DistributedCache {
public final static String TMP_PREFIX = "tmp_"; public final static String TMP_PREFIX = "tmp_";
public final static int DEFAULT_BUFFER_SIZE = 8192;
private Map<String, FutureTask<Path>> cacheCopyTasks = new HashMap<String, FutureTask<Path>>(); private Map<String, FutureTask<Path>> cacheCopyTasks = new HashMap<String, FutureTask<Path>>();
public static void addCachedFile(String name, String filePath, Configuration conf) { public static void addCachedFile(String name, String filePath, Configuration conf) {
...@@ -60,10 +67,8 @@ public class DistributedCache { ...@@ -60,10 +67,8 @@ public class DistributedCache {
//The FutureTask.get() method will block until the file is ready. //The FutureTask.get() method will block until the file is ready.
try { try {
tmp = cacheCopyTasks.get(name).get(); tmp = cacheCopyTasks.get(name).get();
} catch (InterruptedException e) { } catch (Exception e) {
e.printStackTrace(); throw new RuntimeException("Error while getting file from distributed cache", e);
} catch (ExecutionException e) {
e.printStackTrace();
} }
return new File(tmp.toString()); return new File(tmp.toString());
} }
......
...@@ -24,6 +24,7 @@ import eu.stratosphere.api.common.accumulators.Histogram; ...@@ -24,6 +24,7 @@ import eu.stratosphere.api.common.accumulators.Histogram;
import eu.stratosphere.api.common.accumulators.IntCounter; import eu.stratosphere.api.common.accumulators.IntCounter;
import eu.stratosphere.api.common.accumulators.LongCounter; import eu.stratosphere.api.common.accumulators.LongCounter;
import eu.stratosphere.api.common.aggregators.Aggregator; import eu.stratosphere.api.common.aggregators.Aggregator;
import eu.stratosphere.api.common.cache.DistributedCache;
import eu.stratosphere.api.common.functions.AbstractFunction; import eu.stratosphere.api.common.functions.AbstractFunction;
import eu.stratosphere.api.common.functions.IterationRuntimeContext; import eu.stratosphere.api.common.functions.IterationRuntimeContext;
import eu.stratosphere.api.common.functions.RuntimeContext; import eu.stratosphere.api.common.functions.RuntimeContext;
...@@ -138,6 +139,11 @@ public abstract class WrappingFunction<T extends AbstractFunction> extends Abstr ...@@ -138,6 +139,11 @@ public abstract class WrappingFunction<T extends AbstractFunction> extends Abstr
return list; return list;
} }
/**
 * Returns the distributed cache by delegating to {@code context.getDistributedCache()}.
 *
 * NOTE(review): {@code context} is declared outside this hunk; presumably it is the runtime context
 * wrapped by this class -- confirm against the enclosing class.
 *
 * @return whatever {@code context.getDistributedCache()} returns
 */
@Override
public DistributedCache getDistributedCache() {
return context.getDistributedCache();
}
} }
private static class WrappingIterationRuntimeContext extends WrappingRuntimeContext implements IterationRuntimeContext { private static class WrappingIterationRuntimeContext extends WrappingRuntimeContext implements IterationRuntimeContext {
......
/***********************************************************************************************************************
* Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
* an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
**********************************************************************************************************************/
package eu.stratosphere.pact.runtime.cache; package eu.stratosphere.pact.runtime.cache;
import eu.stratosphere.api.common.cache.DistributedCache; import eu.stratosphere.api.common.cache.DistributedCache;
...@@ -10,6 +23,8 @@ import eu.stratosphere.core.fs.Path; ...@@ -10,6 +23,8 @@ import eu.stratosphere.core.fs.Path;
import eu.stratosphere.core.fs.local.LocalFileSystem; import eu.stratosphere.core.fs.local.LocalFileSystem;
import eu.stratosphere.nephele.jobgraph.JobID; import eu.stratosphere.nephele.jobgraph.JobID;
import eu.stratosphere.nephele.taskmanager.runtime.ExecutorThreadFactory; import eu.stratosphere.nephele.taskmanager.runtime.ExecutorThreadFactory;
import eu.stratosphere.nephele.util.IOUtils;
import org.apache.commons.lang3.tuple.ImmutablePair; import org.apache.commons.lang3.tuple.ImmutablePair;
import org.apache.commons.lang3.tuple.Pair; import org.apache.commons.lang3.tuple.Pair;
...@@ -28,7 +43,7 @@ public class FileCache { ...@@ -28,7 +43,7 @@ public class FileCache {
private LocalFileSystem lfs = new LocalFileSystem(); private LocalFileSystem lfs = new LocalFileSystem();
private Map<Pair<JobID, String>, Boolean> active = new HashMap<Pair<JobID,String>, Boolean>(); private Map<Pair<JobID, String>, Integer> count = new HashMap<Pair<JobID,String>, Integer>();
private final ScheduledExecutorService executorService = Executors.newScheduledThreadPool(10, ExecutorThreadFactory.INSTANCE); private final ScheduledExecutorService executorService = Executors.newScheduledThreadPool(10, ExecutorThreadFactory.INSTANCE);
...@@ -37,8 +52,13 @@ public class FileCache { ...@@ -37,8 +52,13 @@ public class FileCache {
*/ */
public FutureTask<Path> createTmpFile(String name, String filePath, JobID jobID) { public FutureTask<Path> createTmpFile(String name, String filePath, JobID jobID) {
synchronized (active) { synchronized (count) {
active.put(new ImmutablePair(jobID,name), true); Pair<JobID, String> key = new ImmutablePair(jobID,name);
if (count.containsKey(key)) {
count.put(key, count.get(key) + 1);
} else {
count.put(key, 1);
}
} }
CopyProcess cp = new CopyProcess(name, filePath, jobID); CopyProcess cp = new CopyProcess(name, filePath, jobID);
FutureTask<Path> copyTask = new FutureTask<Path>(cp); FutureTask<Path> copyTask = new FutureTask<Path>(cp);
...@@ -50,10 +70,7 @@ public class FileCache { ...@@ -50,10 +70,7 @@ public class FileCache {
* Leave a 5 seconds delay to clear the local file. * Leave a 5 seconds delay to clear the local file.
*/ */
public void deleteTmpFile(String name, JobID jobID) { public void deleteTmpFile(String name, JobID jobID) {
synchronized (active) { DeleteProcess dp = new DeleteProcess(name, jobID, count.get(new ImmutablePair(jobID,name)));
active.put(new ImmutablePair(jobID, name), false);
}
DeleteProcess dp = new DeleteProcess(name, jobID);
executorService.schedule(dp, 5000L, TimeUnit.MILLISECONDS); executorService.schedule(dp, 5000L, TimeUnit.MILLISECONDS);
} }
...@@ -68,7 +85,7 @@ public class FileCache { ...@@ -68,7 +85,7 @@ public class FileCache {
try { try {
this.executorService.awaitTermination(5000L, TimeUnit.MILLISECONDS); this.executorService.awaitTermination(5000L, TimeUnit.MILLISECONDS);
} catch (InterruptedException e) { } catch (InterruptedException e) {
e.printStackTrace(); throw new RuntimeException("Error shutting down the file cache", e);
} }
} }
} }
...@@ -94,17 +111,10 @@ public class FileCache { ...@@ -94,17 +111,10 @@ public class FileCache {
Path distributedPath = new Path(filePath); Path distributedPath = new Path(filePath);
FileSystem fs = distributedPath.getFileSystem(); FileSystem fs = distributedPath.getFileSystem();
FSDataInputStream fsInput = fs.open(distributedPath); FSDataInputStream fsInput = fs.open(distributedPath);
byte [] buffer = new byte[DistributedCache.DEFAULT_BUFFER_SIZE]; IOUtils.copyBytes(fsInput, lfsOutput);
int num = fsInput.read(buffer);
while (num != -1) {
lfsOutput.write(buffer, 0, num);
num = fsInput.read(buffer);
}
fsInput.close();
lfsOutput.close();
} }
} catch (IOException e1) { } catch (IOException e1) {
e1.printStackTrace(); throw new RuntimeException("Error copying a file from hdfs to the local fs", e1);
} }
return tmp; return tmp;
} }
...@@ -115,15 +125,17 @@ public class FileCache { ...@@ -115,15 +125,17 @@ public class FileCache {
private class DeleteProcess implements Runnable { private class DeleteProcess implements Runnable {
private String name; private String name;
private JobID jobID; private JobID jobID;
private int oldCount;
public DeleteProcess(String name, JobID jobID) { public DeleteProcess(String name, JobID jobID, int c) {
this.name = name; this.name = name;
this.jobID = jobID; this.jobID = jobID;
this.oldCount = c;
} }
public void run() { public void run() {
synchronized (active) { synchronized (count) {
if (active.get(new ImmutablePair(jobID, name))) { if (count.get(new ImmutablePair(jobID, name)) != oldCount) {
return; return;
} }
} }
...@@ -133,7 +145,7 @@ public class FileCache { ...@@ -133,7 +145,7 @@ public class FileCache {
lfs.delete(tmp, true); lfs.delete(tmp, true);
} }
} catch (IOException e1) { } catch (IOException e1) {
e1.printStackTrace(); throw new RuntimeException("Error deleting the file", e1);
} }
} }
} }
......
/***********************************************************************************************************************
* Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
* an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
**********************************************************************************************************************/
package eu.stratosphere.pact.runtime.cache;
import com.google.common.base.Charsets;
import com.google.common.io.Files;
import eu.stratosphere.core.fs.Path;
import eu.stratosphere.core.fs.local.LocalFileSystem;
import eu.stratosphere.nephele.jobgraph.JobID;
import junit.framework.Assert;
import org.junit.Before;
import org.junit.Test;
import org.junit.After;
import java.io.File;
import java.io.IOException;
/**
 * Tests the delete process of {@link FileCache}. The local cache file must not be deleted when another task
 * requests the same file within the 5 second deletion delay, and it must be deleted once no further task
 * requests it.
 */
public class FileCacheDeleteValidationTest {

	/** Name of the source file that is written to {@code java.io.tmpdir} before each test. */
	private static final String SOURCE_FILE_NAME = "cacheFile";

	/** Name under which the source file is registered with the file cache. */
	private static final String CACHE_ENTRY_NAME = "test_file";

	private final FileCache fileCache = new FileCache();

	private final LocalFileSystem lfs = new LocalFileSystem();

	private final String testFileContent = "Goethe - Faust: Der Tragoedie erster Teil\n" + "Prolog im Himmel.\n"
		+ "Der Herr. Die himmlischen Heerscharen. Nachher Mephistopheles. Die drei\n" + "Erzengel treten vor.\n"
		+ "RAPHAEL: Die Sonne toent, nach alter Weise, In Brudersphaeren Wettgesang,\n"
		+ "Und ihre vorgeschriebne Reise Vollendet sie mit Donnergang. Ihr Anblick\n"
		+ "gibt den Engeln Staerke, Wenn keiner Sie ergruenden mag; die unbegreiflich\n"
		+ "hohen Werke Sind herrlich wie am ersten Tag.\n"
		+ "GABRIEL: Und schnell und unbegreiflich schnelle Dreht sich umher der Erde\n"
		+ "Pracht; Es wechselt Paradieseshelle Mit tiefer, schauervoller Nacht. Es\n"
		+ "schaeumt das Meer in breiten Fluessen Am tiefen Grund der Felsen auf, Und\n"
		+ "Fels und Meer wird fortgerissen Im ewig schnellem Sphaerenlauf.\n"
		+ "MICHAEL: Und Stuerme brausen um die Wette Vom Meer aufs Land, vom Land\n"
		+ "aufs Meer, und bilden wuetend eine Kette Der tiefsten Wirkung rings umher.\n"
		+ "Da flammt ein blitzendes Verheeren Dem Pfade vor des Donnerschlags. Doch\n"
		+ "deine Boten, Herr, verehren Das sanfte Wandeln deines Tags.\n";

	/**
	 * Writes the test content to the source file in {@code java.io.tmpdir}.
	 *
	 * @throws RuntimeException if the file cannot be written
	 */
	@Before
	public void createTmpCacheFile() {
		File f = sourceFile();
		try {
			Files.write(testFileContent, f, Charsets.UTF_8);
		} catch (IOException e) {
			throw new RuntimeException("Error initializing the test", e);
		}
	}

	/**
	 * Registers and releases the same cache entry twice. After the first release a second task re-registers
	 * the file within the deletion delay, so the local copy must survive. After the second release nothing
	 * re-registers it, so the local copy must be gone once the delay has passed.
	 */
	@Test
	public void testFileReuseForNextTask() {
		JobID jobID = new JobID();
		String filePath = "file://" + new Path(System.getProperty("java.io.tmpdir"), SOURCE_FILE_NAME).toString();

		// first task: register the file, give the copy some time, then release it
		fileCache.createTmpFile(CACHE_ENTRY_NAME, filePath, jobID);
		sleep(1000);
		fileCache.deleteTmpFile(CACHE_ENTRY_NAME, jobID);
		sleep(1000);

		// a new task comes 1 second after the release, i.e. before the delayed delete fires
		Assert.assertTrue("Local cache file should not be deleted when another task comes in 5 seconds!",
			localCopyExists(jobID));
		fileCache.createTmpFile(CACHE_ENTRY_NAME, filePath, jobID);
		sleep(1000);
		fileCache.deleteTmpFile(CACHE_ENTRY_NAME, jobID);

		// no task comes in 7 seconds, which is longer than the deletion delay
		sleep(7000);
		Assert.assertFalse("Local cache file should be deleted when no task comes in 5 seconds!",
			localCopyExists(jobID));
	}

	/**
	 * Shuts down the file cache and removes the source file created by {@link #createTmpCacheFile()}.
	 */
	@After
	public void shutdown() {
		try {
			fileCache.shutdown();
		} finally {
			// Best-effort cleanup so the test leaves nothing behind in java.io.tmpdir;
			// a failed delete must not mask the test result, so the return value is ignored.
			sourceFile().delete();
		}
	}

	/** Returns the handle of the source file inside {@code java.io.tmpdir}. */
	private static File sourceFile() {
		return new File(System.getProperty("java.io.tmpdir"), SOURCE_FILE_NAME);
	}

	/** Sleeps for the given number of milliseconds; restores the interrupt flag and fails if interrupted. */
	private static void sleep(long millis) {
		try {
			Thread.sleep(millis);
		} catch (InterruptedException e) {
			// keep the interrupt visible to the test runner instead of silently clearing it
			Thread.currentThread().interrupt();
			throw new RuntimeException("Interrupted error", e);
		}
	}

	/** Checks whether the local copy of the cache entry for the given job currently exists. */
	private boolean localCopyExists(JobID jobID) {
		try {
			return lfs.exists(fileCache.getTempDir(jobID, CACHE_ENTRY_NAME));
		} catch (IOException e) {
			throw new RuntimeException("Error checking whether the local cache file exists", e);
		}
	}
}
/***********************************************************************************************************************
* Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
* an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
**********************************************************************************************************************/
package eu.stratosphere.test.distributedCache; package eu.stratosphere.test.distributedCache;
import eu.stratosphere.api.common.Plan; import eu.stratosphere.api.common.Plan;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册