diff --git a/cbutil/ncu_parser.py b/cbutil/ncu_parser.py
index 9af5f27c88e2f7a36791de14cc79ba9fe99164c3..327344e5d342f67a7344b3166a15c6ca71c7540b 100644
--- a/cbutil/ncu_parser.py
+++ b/cbutil/ncu_parser.py
@@ -67,7 +67,7 @@ def extract_raw_counter(df: pd.DataFrame):
 
     tags["Block Size"] = df["Block Size"]
     tags["Grid Size"] = df["Grid Size"]
-    tags["GPU"] = df["device__attribute_display_name"].replace(" ", "")
+    tags["GPU"] = df["device__attribute_display_name"].str.replace(" ", "")
 
     fields[memory_write_data_key] = normalize_and_add_prefix(
         df["dram__bytes_write.sum"], "G"
diff --git a/tests/test_ncu_parser.py b/tests/test_ncu_parser.py
index ab38be61f32dab3c068cc8f27747b26e63cbcf3f..c49460e6b67dccedfbd9668dd29de0e44c69e87c 100644
--- a/tests/test_ncu_parser.py
+++ b/tests/test_ncu_parser.py
@@ -10,7 +10,7 @@ def sample_data():
     data = {
         ("Block Size", ""): [128, 256, 512],
         ("Grid Size", ""): [64, 128, 256],
-        ("device__attribute_display_name", ""): ["GPU1", "GPU2", "GPU3"],
+        ("device__attribute_display_name", ""): ["  GPU 1", "GPU2", "GPU 3"],
         ("dram__bytes_write.sum", "Bytes"): [1e9, 2e9, 3e9],
         ("dram__bytes_read.sum", "GBytes"): [0.5, 1., 1.5],
         ("dram__bytes_write.sum.per_second", "MByte/s"): [100, 200, 300],