-
Notifications
You must be signed in to change notification settings - Fork 188
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Github-issue#1048 : s3-sink with local-file buffer implementation. #2645
Changes from 6 commits
ab1862c
00e2e5f
dbe2811
1cff631
45e1242
00f59cf
c2394dc
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,114 @@ | ||
/* | ||
* Copyright OpenSearch Contributors | ||
* SPDX-License-Identifier: Apache-2.0 | ||
*/ | ||
|
||
package org.opensearch.dataprepper.plugins.sink.accumulator; | ||
|
||
import org.apache.commons.lang3.time.StopWatch; | ||
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
import software.amazon.awssdk.core.sync.RequestBody; | ||
import software.amazon.awssdk.services.s3.S3Client; | ||
import software.amazon.awssdk.services.s3.model.PutObjectRequest; | ||
import java.io.BufferedOutputStream; | ||
import java.io.File; | ||
import java.io.FileNotFoundException; | ||
import java.io.FileOutputStream; | ||
import java.io.IOException; | ||
import java.io.OutputStream; | ||
import java.nio.file.Files; | ||
import java.nio.file.Paths; | ||
import java.util.concurrent.TimeUnit; | ||
|
||
/** | ||
* A buffer can hold local file data and flushing it to S3. | ||
*/ | ||
public class LocalFileBuffer implements Buffer { | ||
|
||
private static final Logger LOG = LoggerFactory.getLogger(LocalFileBuffer.class); | ||
private final OutputStream outputStream; | ||
private int eventCount; | ||
private final StopWatch watch; | ||
private final File localFile; | ||
|
||
LocalFileBuffer(File tempFile) throws FileNotFoundException { | ||
localFile = tempFile; | ||
outputStream = new BufferedOutputStream(new FileOutputStream(tempFile)); | ||
eventCount = 0; | ||
watch = new StopWatch(); | ||
watch.start(); | ||
} | ||
|
||
@Override | ||
public long getSize() { | ||
try { | ||
outputStream.flush(); | ||
} catch (IOException e) { | ||
LOG.error("An exception occurred while flushing data to buffered output stream :", e); | ||
} | ||
return localFile.length(); | ||
} | ||
|
||
@Override | ||
public int getEventCount() { | ||
return eventCount; | ||
} | ||
|
||
@Override | ||
public long getDuration(){ | ||
return watch.getTime(TimeUnit.SECONDS); | ||
} | ||
|
||
/** | ||
* Upload accumulated data to amazon s3. | ||
* @param s3Client s3 client object. | ||
* @param bucket bucket name. | ||
* @param key s3 object key path. | ||
*/ | ||
@Override | ||
public void flushToS3(S3Client s3Client, String bucket, String key) { | ||
flushAndCloseStream(); | ||
s3Client.putObject( | ||
PutObjectRequest.builder().bucket(bucket).key(key).build(), | ||
RequestBody.fromFile(localFile)); | ||
removeTemporaryFile(); | ||
} | ||
|
||
/** | ||
* write byte array to output stream. | ||
* @param bytes byte array. | ||
* @throws IOException while writing to output stream fails. | ||
*/ | ||
@Override | ||
public void writeEvent(byte[] bytes) throws IOException { | ||
outputStream.write(bytes); | ||
outputStream.write(System.lineSeparator().getBytes()); | ||
eventCount++; | ||
} | ||
|
||
/** | ||
* Flushing the buffered data into the output stream. | ||
*/ | ||
protected void flushAndCloseStream(){ | ||
try { | ||
outputStream.flush(); | ||
outputStream.close(); | ||
} catch (IOException e) { | ||
LOG.error("An exception occurred while flushing data to buffered output stream :", e); | ||
} | ||
} | ||
|
||
/** | ||
* Remove the local temp file after flushing data to s3. | ||
*/ | ||
protected void removeTemporaryFile() { | ||
if (localFile != null) { | ||
try { | ||
Files.deleteIfExists(Paths.get(localFile.toString())); | ||
} catch (IOException e) { | ||
LOG.error("Unable to delete Local file {}", localFile, e); | ||
} | ||
} | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,30 @@ | ||
/* | ||
* Copyright OpenSearch Contributors | ||
* SPDX-License-Identifier: Apache-2.0 | ||
*/ | ||
|
||
package org.opensearch.dataprepper.plugins.sink.accumulator; | ||
|
||
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
import java.io.File; | ||
import java.io.IOException; | ||
|
||
public class LocalFileBufferFactory implements BufferFactory { | ||
|
||
private static final Logger LOG = LoggerFactory.getLogger(LocalFileBufferFactory.class); | ||
public static final String PREFIX = "local"; | ||
public static final String SUFFIX = ".log"; | ||
@Override | ||
public Buffer getBuffer() { | ||
File tempFile = null; | ||
Buffer localfileBuffer = null; | ||
try { | ||
tempFile = File.createTempFile(PREFIX, SUFFIX); | ||
localfileBuffer = new LocalFileBuffer(tempFile); | ||
} catch (IOException e) { | ||
LOG.error("Unable to create temp file ", e); | ||
} | ||
return localfileBuffer; | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
/* | ||
* Copyright OpenSearch Contributors | ||
* SPDX-License-Identifier: Apache-2.0 | ||
*/ | ||
|
||
package org.opensearch.dataprepper.plugins.sink.accumulator; | ||
|
||
import org.junit.jupiter.api.Assertions; | ||
import org.junit.jupiter.api.Test; | ||
import static org.hamcrest.CoreMatchers.instanceOf; | ||
import static org.hamcrest.MatcherAssert.assertThat; | ||
|
||
// Unit tests for LocalFileBufferFactory.
class LocalFileBufferFactoryTest { | ||
// Checks that the factory can be created with its no-argument constructor.
@Test | ||
void test_localFileBufferFactory_notNull() { | ||
LocalFileBufferFactory localFileBufferFactory = new LocalFileBufferFactory(); | ||
Assertions.assertNotNull(localFileBufferFactory); | ||
} | ||
|
||
// Checks that getBuffer() returns a non-null buffer whose concrete type is LocalFileBuffer.
@Test | ||
void test_buffer_notNull() { | ||
LocalFileBufferFactory localFileBufferFactory = new LocalFileBufferFactory(); | ||
Assertions.assertNotNull(localFileBufferFactory); | ||
Buffer buffer = localFileBufferFactory.getBuffer(); | ||
Assertions.assertNotNull(buffer); | ||
// NOTE(review): this check adds nothing, since `buffer` is already declared as Buffer;
// the LocalFileBuffer assertion further down is the meaningful one.
assertThat(buffer, instanceOf(Buffer.class)); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. You should assert that this is an instance of
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Addressed. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. @deepaksahu562 , Did you push the change here? I don't see a new assertion for this. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. @dlvenable, Earlier, I didn't understand. Now I can understand and modify as requested. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It should be as simple as changing this line to:
Here it is with a little more context.
We already know this is a There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Please change this line per my latest comment. Then we should be good. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Thanks for your clarification, Modified as you suggested. |
||
assertThat(buffer, instanceOf(LocalFileBuffer.class)); | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,125 @@ | ||
package org.opensearch.dataprepper.plugins.sink.accumulator; | ||
|
||
import org.junit.jupiter.api.AfterEach; | ||
import org.junit.jupiter.api.Assertions; | ||
import org.junit.jupiter.api.BeforeEach; | ||
import org.junit.jupiter.api.Test; | ||
import org.junit.jupiter.api.extension.ExtendWith; | ||
import org.mockito.ArgumentCaptor; | ||
import org.mockito.Mock; | ||
import org.mockito.junit.jupiter.MockitoExtension; | ||
import software.amazon.awssdk.core.sync.RequestBody; | ||
import software.amazon.awssdk.services.s3.S3Client; | ||
import software.amazon.awssdk.services.s3.model.PutObjectRequest; | ||
import java.io.File; | ||
import java.io.IOException; | ||
import java.util.UUID; | ||
import static org.hamcrest.CoreMatchers.equalTo; | ||
import static org.hamcrest.CoreMatchers.notNullValue; | ||
import static org.hamcrest.CoreMatchers.nullValue; | ||
import static org.hamcrest.MatcherAssert.assertThat; | ||
import static org.hamcrest.Matchers.greaterThan; | ||
import static org.hamcrest.Matchers.greaterThanOrEqualTo; | ||
import static org.junit.jupiter.api.Assertions.assertDoesNotThrow; | ||
import static org.junit.jupiter.api.Assertions.assertFalse; | ||
import static org.mockito.ArgumentMatchers.any; | ||
import static org.mockito.Mockito.verify; | ||
|
||
@ExtendWith(MockitoExtension.class) | ||
class LocalFileBufferTest { | ||
|
||
// Bucket name and object key passed to flushToS3; generated randomly when the class is loaded.
public static final String BUCKET_NAME = UUID.randomUUID().toString(); | ||
public static final String KEY = UUID.randomUUID().toString() + ".log"; | ||
// Prefix and suffix used by setUp() when creating the temporary backing file.
public static final String PREFIX = "local"; | ||
public static final String SUFFIX = ".log"; | ||
// Mockito mock used in place of a real S3 client.
@Mock | ||
private S3Client s3Client; | ||
// Buffer under test and the file that backs it; both are re-created in setUp().
private LocalFileBuffer localFileBuffer; | ||
private File tempFile; | ||
|
||
@BeforeEach | ||
void setUp() throws IOException { | ||
tempFile = File.createTempFile(PREFIX, SUFFIX); | ||
localFileBuffer = new LocalFileBuffer(tempFile); | ||
} | ||
|
||
@Test | ||
void test_with_write_events_into_buffer() throws IOException { | ||
while (localFileBuffer.getEventCount() < 55) { | ||
localFileBuffer.writeEvent(generateByteArray()); | ||
} | ||
assertThat(localFileBuffer.getSize(), greaterThan(1l)); | ||
assertThat(localFileBuffer.getEventCount(), equalTo(55)); | ||
assertThat(localFileBuffer.getDuration(), equalTo(0L)); | ||
localFileBuffer.flushAndCloseStream(); | ||
localFileBuffer.removeTemporaryFile(); | ||
assertFalse(tempFile.exists(), "The temp file has not been deleted."); | ||
} | ||
|
||
@Test | ||
void test_without_write_events_into_buffer() { | ||
assertThat(localFileBuffer.getSize(), equalTo(0L)); | ||
assertThat(localFileBuffer.getEventCount(), equalTo(0)); | ||
assertThat(localFileBuffer.getDuration(), equalTo(0L)); | ||
localFileBuffer.flushAndCloseStream(); | ||
localFileBuffer.removeTemporaryFile(); | ||
assertFalse(tempFile.exists(), "The temp file has not been deleted."); | ||
} | ||
|
||
@Test | ||
void test_with_write_events_into_buffer_and_flush_toS3() throws IOException { | ||
while (localFileBuffer.getEventCount() < 55) { | ||
localFileBuffer.writeEvent(generateByteArray()); | ||
} | ||
assertThat(localFileBuffer.getSize(), greaterThan(1l)); | ||
assertThat(localFileBuffer.getEventCount(), equalTo(55)); | ||
assertThat(localFileBuffer.getDuration(), greaterThanOrEqualTo(0L)); | ||
|
||
assertDoesNotThrow(() -> { | ||
localFileBuffer.flushToS3(s3Client, BUCKET_NAME, KEY); | ||
}); | ||
|
||
ArgumentCaptor<PutObjectRequest> putObjectRequestArgumentCaptor = ArgumentCaptor.forClass(PutObjectRequest.class); | ||
verify(s3Client).putObject(putObjectRequestArgumentCaptor.capture(), any(RequestBody.class)); | ||
PutObjectRequest actualRequest = putObjectRequestArgumentCaptor.getValue(); | ||
|
||
assertThat(actualRequest, notNullValue()); | ||
assertThat(actualRequest.bucket(), equalTo(BUCKET_NAME)); | ||
assertThat(actualRequest.key(), equalTo(KEY)); | ||
assertThat(actualRequest.expectedBucketOwner(), nullValue()); | ||
|
||
assertFalse(tempFile.exists(), "The temp file has not been deleted."); | ||
} | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. You need to verify that the file was flushed to S3. Since this is not an integration test, you will do this via mocking. It should look something like the following:
Also, this should validate that the file was actually deleted. You will do this with real files (not mocks). There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Modified and addressed as per suggestions. |
||
|
||
@Test | ||
void test_uploadedToS3_success() { | ||
Assertions.assertNotNull(localFileBuffer); | ||
assertDoesNotThrow(() -> { | ||
localFileBuffer.flushToS3(s3Client, BUCKET_NAME, KEY); | ||
}); | ||
|
||
ArgumentCaptor<PutObjectRequest> putObjectRequestArgumentCaptor = ArgumentCaptor.forClass(PutObjectRequest.class); | ||
verify(s3Client).putObject(putObjectRequestArgumentCaptor.capture(), any(RequestBody.class)); | ||
PutObjectRequest actualRequest = putObjectRequestArgumentCaptor.getValue(); | ||
|
||
assertThat(actualRequest, notNullValue()); | ||
assertThat(actualRequest.bucket(), equalTo(BUCKET_NAME)); | ||
assertThat(actualRequest.key(), equalTo(KEY)); | ||
assertThat(actualRequest.expectedBucketOwner(), nullValue()); | ||
|
||
assertFalse(tempFile.exists(), "The temp file has not been deleted."); | ||
} | ||
|
||
@AfterEach | ||
void cleanup() { | ||
tempFile.deleteOnExit(); | ||
} | ||
|
||
private byte[] generateByteArray() { | ||
byte[] bytes = new byte[1000]; | ||
for (int i = 0; i < 1000; i++) { | ||
bytes[i] = (byte) i; | ||
} | ||
return bytes; | ||
} | ||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Yes, this is a good change. Thanks!