1
0
mirror of https://github.com/alecthomas/chroma.git synced 2025-01-26 03:20:10 +02:00
chroma/lexers/lexer_benchmark_test.go

219 lines
7.5 KiB
Go

package lexers_test
import (
"testing"
assert "github.com/alecthomas/assert/v2"
"github.com/alecthomas/chroma/v2"
"github.com/alecthomas/chroma/v2/lexers"
)
const lexerBenchSource = `/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.kafka.server.common;
import org.apache.kafka.common.utils.Utils;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStreamWriter;
import java.nio.charset.StandardCharsets;
import java.nio.file.FileAlreadyExistsException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.Paths;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
import java.util.Optional;
/**
* This class represents a utility to capture a checkpoint in a file. It writes down to the file in the below format.
*
* ========= File beginning =========
* version: int
* entries-count: int
* entry-as-string-on-each-line
* ========= File end ===============
*
* Each entry is represented as a string on each line in the checkpoint file. {@link EntryFormatter} is used
* to convert the entry into a string and vice versa.
*
* @param <T> entry type.
*/
public class CheckpointFile<T> {
private final int version;
private final EntryFormatter<T> formatter;
private final Object lock = new Object();
private final Path absolutePath;
private final Path tempPath;
public CheckpointFile(File file,
int version,
EntryFormatter<T> formatter) throws IOException {
this.version = version;
this.formatter = formatter;
try {
// Create the file if it does not exist.
Files.createFile(file.toPath());
} catch (FileAlreadyExistsException ex) {
// Ignore if file already exists.
}
absolutePath = file.toPath().toAbsolutePath();
tempPath = Paths.get(absolutePath.toString() + ".tmp");
}
public void write(Collection<T> entries) throws IOException {
synchronized (lock) {
// write to temp file and then swap with the existing file
try (FileOutputStream fileOutputStream = new FileOutputStream(tempPath.toFile());
BufferedWriter writer = new BufferedWriter(new OutputStreamWriter(fileOutputStream, StandardCharsets.UTF_8))) {
// Write the version
writer.write(Integer.toString(version));
writer.newLine();
// Write the entries count
writer.write(Integer.toString(entries.size()));
writer.newLine();
// Write each entry on a new line.
for (T entry : entries) {
writer.write(formatter.toString(entry));
writer.newLine();
}
writer.flush();
fileOutputStream.getFD().sync();
}
Utils.atomicMoveWithFallback(tempPath, absolutePath);
}
}
public List<T> read() throws IOException {
synchronized (lock) {
try (BufferedReader reader = Files.newBufferedReader(absolutePath)) {
CheckpointReadBuffer<T> checkpointBuffer = new CheckpointReadBuffer<>(absolutePath.toString(), reader, version, formatter);
return checkpointBuffer.read();
}
}
}
private static class CheckpointReadBuffer<T> {
private final String location;
private final BufferedReader reader;
private final int version;
private final EntryFormatter<T> formatter;
CheckpointReadBuffer(String location,
BufferedReader reader,
int version,
EntryFormatter<T> formatter) {
this.location = location;
this.reader = reader;
this.version = version;
this.formatter = formatter;
}
List<T> read() throws IOException {
String line = reader.readLine();
if (line == null)
return Collections.emptyList();
int readVersion = toInt(line);
if (readVersion != version) {
throw new IOException("Unrecognised version:" + readVersion + ", expected version: " + version
+ " in checkpoint file at: " + location);
}
line = reader.readLine();
if (line == null) {
return Collections.emptyList();
}
int expectedSize = toInt(line);
List<T> entries = new ArrayList<>(expectedSize);
line = reader.readLine();
while (line != null) {
Optional<T> maybeEntry = formatter.fromString(line);
if (!maybeEntry.isPresent()) {
throw buildMalformedLineException(line);
}
entries.add(maybeEntry.get());
line = reader.readLine();
}
if (entries.size() != expectedSize) {
throw new IOException("Expected [" + expectedSize + "] entries in checkpoint file ["
+ location + "], but found only [" + entries.size() + "]");
}
return entries;
}
private int toInt(String line) throws IOException {
try {
return Integer.parseInt(line);
} catch (NumberFormatException e) {
throw buildMalformedLineException(line);
}
}
private IOException buildMalformedLineException(String line) {
return new IOException(String.format("Malformed line in checkpoint file [%s]: %s", location, line));
}
}
/**
* This is used to convert the given entry of type {@code T} into a string and vice versa.
*
* @param <T> entry type
*/
public interface EntryFormatter<T> {
/**
* @param entry entry to be converted into string.
* @return String representation of the given entry.
*/
String toString(T entry);
/**
* @param value string representation of an entry.
* @return entry converted from the given string representation if possible. {@link Optional#empty()} represents
* that the given string representation could not be converted into an entry.
*/
Optional<T> fromString(String value);
}
}
`
func Benchmark(b *testing.B) {
b.ReportAllocs()
for i := 0; i < b.N; i++ {
it, err := lexers.GlobalLexerRegistry.Get("Java").Tokenise(nil, lexerBenchSource)
assert.NoError(b, err)
for t := it(); t != chroma.EOF; t = it() {
}
}
}