diff --git a/include/mtl/vec.hpp b/include/mtl/vec.hpp
index d499fdb..4568ad0 100644
--- a/include/mtl/vec.hpp
+++ b/include/mtl/vec.hpp
@@ -21,11 +21,15 @@ public:
 	constexpr vec(const vec<N>& other) noexcept {
 		// We need to explicitly define the copy constructor, otherwise
 		// GCC uses memcpy to copy while in Thumb mode, and that's slow.
+#pragma GCC unroll 4 // Force per-loop unrolling. Other pragmas or attributes
+		     // (presumably the function-level optimize ones -- confirm) can't
+		     // be used: they don't work for inlined functions. Requires GCC 8.1.
 		for (size_t i = 0; i < N; ++i) {
 			e[i] = other.e[i];
 		}
 	}
 	constexpr vec(const fixed (&_e)[N]) noexcept {
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			e[i] = _e[i];
 		}
@@ -41,6 +45,7 @@ public:
 	vec<N> operator+(const vec<N>& rhs) const noexcept {
 		vec<N> res;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			res[i] = e[i] + rhs[i];
 		}
@@ -51,6 +56,7 @@ public:
 	vec<N> operator-(const vec<N>& rhs) const noexcept {
 		vec<N> res;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			res[i] = e[i] - rhs[i];
 		}
@@ -61,6 +67,7 @@ public:
 	vec<N> operator-() const noexcept {
 		vec<N> res;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			res[i] = -e[i];
 		}
@@ -71,6 +78,7 @@ public:
 	vec<N> operator*(fixed rhs) const noexcept {
 		vec<N> res;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			res[i] = e[i] * rhs;
 		}
@@ -84,6 +92,7 @@ public:
 	fixed operator*(const vec<N>& rhs) const noexcept {
 		fixed res;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			res += e[i] * rhs[i];
 		}
@@ -94,6 +103,7 @@ public:
 	vec<N> operator/(fixed rhs) const noexcept {
 		vec<N> r;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			r[i] = e[i] / rhs;
 		}
@@ -104,6 +114,7 @@ public:
 	fixed magnitude_sqr() const noexcept {
 		fixed r;
 
+#pragma GCC unroll 4
 		for (size_t i = 0; i < N; ++i) {
 			r += e[i] * e[i];
 		}